13578 lines
362 KiB
JSON
13578 lines
362 KiB
JSON
{
|
|
"meta": {
|
|
"generated_at": "2026-04-29T05:45:18Z",
|
|
"system_info": {
|
|
"distro": "Fedora Linux 43 (Workstation Edition)",
|
|
"kernel": "6.19.9-200.fc43.x86_64",
|
|
"linux_firmware": "linux-firmware-20260309-1.fc43.noarch",
|
|
"timestamp": "10 Apr 2026"
|
|
},
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
},
|
|
{
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
},
|
|
{
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm-7_2",
|
|
"rocm-7_2_2",
|
|
"rocm-7_2_2-pr21344",
|
|
"rocm6_4_4",
|
|
"rocm7-nightlies",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.06,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.76,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 77.83,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.1,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.4,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.57,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.06,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.34,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 46.91,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 7.32,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 403.45,
|
|
"tps_std": 2.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 87.65,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 87.91,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 392.81,
|
|
"tps_std": 1.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 94.55,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.89,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 400.57,
|
|
"tps_std": 4.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 86.01,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.86,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 114.94,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 326.36,
|
|
"tps_std": 4.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.5,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.0,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.82,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1058.1,
|
|
"tps_std": 2.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 91.21,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.62,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 889.16,
|
|
"tps_std": 36.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 91.01,
|
|
"tps_std": 1.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 903.01,
|
|
"tps_std": 2.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.7,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 888.7,
|
|
"tps_std": 38.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 89.53,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 499.74,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 39.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 875.8,
|
|
"tps_std": 2.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 40.19,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 134.1,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.18,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 356.93,
|
|
"tps_std": 1.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.97,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 65.86,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.1,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 236.39,
|
|
"tps_std": 1.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.64,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 64.53,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.04,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 236.56,
|
|
"tps_std": 1.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 77.34,
|
|
"tps_std": 1.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.54,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 225.65,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.44,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 64.1,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.35,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 202.08,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 31.48,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.27,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 231.25,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.7,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.0,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.47,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 87.2,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 245.87,
|
|
"tps_std": 1.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 81.2,
|
|
"tps_std": 1.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.69,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 238.13,
|
|
"tps_std": 1.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.54,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 61.41,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.64,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 203.65,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.07,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 31.64,
|
|
"tps_std": 0.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 230.72,
|
|
"tps_std": 8.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.06,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.12,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 745.5,
|
|
"tps_std": 9.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 164.19,
|
|
"tps_std": 1.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 732.09,
|
|
"tps_std": 2.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.01,
|
|
"tps_std": 2.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 716.84,
|
|
"tps_std": 2.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.12,
|
|
"tps_std": 0.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 726.92,
|
|
"tps_std": 2.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 162.4,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 164.2,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 72.41,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 333.46,
|
|
"tps_std": 1.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.99,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 307.47,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.6,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 267.67,
|
|
"tps_std": 1.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.18,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 304.86,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.79,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 261.51,
|
|
"tps_std": 1.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 323.83,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 232.54,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.15,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.34,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 138.78,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.45,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 104.96,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.66,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 191.97,
|
|
"tps_std": 8.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.7,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 185.9,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1498.5,
|
|
"tps_std": 6.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.29,
|
|
"tps_std": 0.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 213.71,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.47,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1149.95,
|
|
"tps_std": 8.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 67.57,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.74,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.36,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1167.77,
|
|
"tps_std": 7.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 65.06,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 291.69,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.81,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1185.86,
|
|
"tps_std": 2.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.95,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 203.21,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.77,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 882.68,
|
|
"tps_std": 3.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.48,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 111.69,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.03,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1145.07,
|
|
"tps_std": 8.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 82.16,
|
|
"tps_std": 3.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.38,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.09,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 418.75,
|
|
"tps_std": 3.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.62,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 207.29,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.34,
|
|
"tps_std": 2.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 314.59,
|
|
"tps_std": 2.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.96,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 235.56,
|
|
"tps_std": 9.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.82,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 316.73,
|
|
"tps_std": 1.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.86,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 275.81,
|
|
"tps_std": 1.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.9,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 318.17,
|
|
"tps_std": 2.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.57,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 223.61,
|
|
"tps_std": 0.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.32,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 182.98,
|
|
"tps_std": 1.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.84,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.77,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 241.15,
|
|
"tps_std": 7.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.75,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.99,
|
|
"tps_std": 0.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.09,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 513.08,
|
|
"tps_std": 3.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.46,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 379.44,
|
|
"tps_std": 1.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.65,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 509.14,
|
|
"tps_std": 3.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 391.47,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 538.42,
|
|
"tps_std": 12.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 412.11,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.59,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 35.0,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 35.0,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 122.43,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 11.55,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 98.18,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 316.59,
|
|
"tps_std": 1.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.8,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 267.07,
|
|
"tps_std": 0.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.6-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.37,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1359.62,
|
|
"tps_std": 5.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 48.34,
|
|
"tps_std": 0.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 670.26,
|
|
"tps_std": 1.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.42,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1089.21,
|
|
"tps_std": 5.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 49.27,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 703.58,
|
|
"tps_std": 0.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 41.08,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1067.33,
|
|
"tps_std": 6.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 48.23,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 769.99,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 41.91,
|
|
"tps_std": 0.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1091.62,
|
|
"tps_std": 10.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 49.1,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 664.89,
|
|
"tps_std": 1.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 42.73,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 663.94,
|
|
"tps_std": 2.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.13,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 292.49,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 43.97,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1045.16,
|
|
"tps_std": 5.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.82,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 682.8,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 48.77,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.81,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1222.77,
|
|
"tps_std": 2.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.72,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 653.49,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.21,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1043.12,
|
|
"tps_std": 46.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.53,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 544.04,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.7,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1049.22,
|
|
"tps_std": 7.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 758.76,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.7,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1036.89,
|
|
"tps_std": 9.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 510.38,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.18,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.25,
|
|
"tps_std": 2.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.25,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 273.77,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.71,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 893.79,
|
|
"tps_std": 4.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.05,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 610.84,
|
|
"tps_std": 1.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.67,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 35.8,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 836.74,
|
|
"tps_std": 6.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.95,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 619.85,
|
|
"tps_std": 6.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 823.65,
|
|
"tps_std": 83.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 628.14,
|
|
"tps_std": 5.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 839.13,
|
|
"tps_std": 7.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 20.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 646.67,
|
|
"tps_std": 11.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.86,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 844.42,
|
|
"tps_std": 19.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 546.66,
|
|
"tps_std": 5.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.11,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 117.96,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.18,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 58.94,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.26,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 376.52,
|
|
"tps_std": 7.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 351.87,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.71,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1608.01,
|
|
"tps_std": 5.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.13,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 689.3,
|
|
"tps_std": 12.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.14,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1299.9,
|
|
"tps_std": 11.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.59,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 693.48,
|
|
"tps_std": 4.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.76,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1288.38,
|
|
"tps_std": 10.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 721.84,
|
|
"tps_std": 10.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.17,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1219.74,
|
|
"tps_std": 15.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 600.42,
|
|
"tps_std": 7.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 720.78,
|
|
"tps_std": 2.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.21,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.79,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.41,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1213.78,
|
|
"tps_std": 7.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 53.04,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 638.76,
|
|
"tps_std": 1.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.93,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1524.44,
|
|
"tps_std": 7.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.68,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 689.36,
|
|
"tps_std": 8.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1272.69,
|
|
"tps_std": 74.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.31,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 696.25,
|
|
"tps_std": 7.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.95,
|
|
"tps_std": 0.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1303.32,
|
|
"tps_std": 8.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 38.81,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 727.92,
|
|
"tps_std": 8.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.52,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1294.4,
|
|
"tps_std": 31.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 596.78,
|
|
"tps_std": 7.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 589.2,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.18,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 97.7,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.82,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 944.96,
|
|
"tps_std": 19.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.58,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 579.88,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.52,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 380.58,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 150.63,
|
|
"tps_std": 1.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.17,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 377.93,
|
|
"tps_std": 2.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 153.11,
|
|
"tps_std": 1.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.18,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.84,
|
|
"tps_std": 1.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 154.86,
|
|
"tps_std": 2.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.14,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 373.84,
|
|
"tps_std": 0.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 139.53,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.16,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 79.53,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 60.29,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 293.27,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 136.84,
|
|
"tps_std": 1.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 310.54,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 140.71,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 309.22,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 143.91,
|
|
"tps_std": 1.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 315.72,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 130.8,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 69.12,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 244.46,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 11.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 124.32,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 282.42,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.6,
|
|
"tps_std": 1.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 308.17,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 138.85,
|
|
"tps_std": 1.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 303.4,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 141.37,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.18,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 319.75,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 128.0,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.26,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 209.2,
|
|
"tps_std": 6.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 112.72,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 945.82,
|
|
"tps_std": 60.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.25,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 311.38,
|
|
"tps_std": 1.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.94,
|
|
"tps_std": 7.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 634.64,
|
|
"tps_std": 3.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.7,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 304.96,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.84,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.77,
|
|
"tps_std": 4.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 49.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 439.58,
|
|
"tps_std": 0.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.77,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 641.05,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 305.81,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.03,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 575.01,
|
|
"tps_std": 3.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.2,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 214.22,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.54,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 635.12,
|
|
"tps_std": 4.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.31,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 290.19,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 42.28,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2029.48,
|
|
"tps_std": 6.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.53,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 494.19,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1631.69,
|
|
"tps_std": 17.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.53,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 490.56,
|
|
"tps_std": 2.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.69,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1694.78,
|
|
"tps_std": 17.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.19,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 730.43,
|
|
"tps_std": 1.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.22,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1635.73,
|
|
"tps_std": 10.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.47,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 493.84,
|
|
"tps_std": 1.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 52.05,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1306.44,
|
|
"tps_std": 9.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.63,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 365.33,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 49.83,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1574.45,
|
|
"tps_std": 16.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 79.03,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 545.65,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 60.7,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1512.85,
|
|
"tps_std": 4.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.54,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 163.39,
|
|
"tps_std": 1.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2-pr21344",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2-pr21344",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "7957de9dc",
|
|
"number": "8645"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1542.98,
|
|
"tps_std": 7.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.52,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 162.64,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f53577432",
|
|
"number": "8942"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1524.35,
|
|
"tps_std": 2.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.78,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 196.44,
|
|
"tps_std": 1.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1513.21,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.41,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 189.28,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 326.38,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.44,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.14,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1311.79,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.59,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 210.35,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.53,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
}
|
|
]
|
|
} |