19281 lines
520 KiB
JSON
19281 lines
520 KiB
JSON
{
|
|
"meta": {
|
|
"generated_at": "2026-03-30T06:55:07Z",
|
|
"system_info": {
|
|
"distro": "Fedora Linux 43 (Workstation Edition)",
|
|
"kernel": "6.19.9-200.fc43.x86_64",
|
|
"linux_firmware": "linux-firmware-20260309-1.fc43.noarch",
|
|
"timestamp": "29 Mar 2026"
|
|
},
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
},
|
|
{
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm-7_2",
|
|
"rocm-7_2-hblt0",
|
|
"rocm6_4_4",
|
|
"rocm6_4_4-hblt0",
|
|
"rocm7-nightlies",
|
|
"rocm7-nightlies-hblt0",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.37,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.07,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.3,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.08,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.37,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.56,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.63,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.58,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.08,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 80.49,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 21.15,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.07,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.97,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 21.17,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 47.2,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 7.39,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 435.72,
|
|
"tps_std": 2.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 87.93,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 403.83,
|
|
"tps_std": 1.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 87.49,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.33,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 393.19,
|
|
"tps_std": 1.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 94.74,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.06,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 393.15,
|
|
"tps_std": 2.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.11,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 94.55,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 476.23,
|
|
"tps_std": 2.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 86.79,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 401.13,
|
|
"tps_std": 5.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 85.92,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.3,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 114.88,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 342.11,
|
|
"tps_std": 5.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.48,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.93,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.82,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 905.79,
|
|
"tps_std": 2.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 91.97,
|
|
"tps_std": 0.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.58,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 893.68,
|
|
"tps_std": 28.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 91.83,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 903.39,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.84,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 906.25,
|
|
"tps_std": 1.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.07,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 902.85,
|
|
"tps_std": 59.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 89.75,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 906.42,
|
|
"tps_std": 2.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 89.99,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 499.98,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 39.01,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 853.46,
|
|
"tps_std": 6.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 40.38,
|
|
"tps_std": 1.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 133.27,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.17,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 673.71,
|
|
"tps_std": 1.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.35,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.3,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 748.37,
|
|
"tps_std": 4.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 165.11,
|
|
"tps_std": 1.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 706.16,
|
|
"tps_std": 3.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.61,
|
|
"tps_std": 1.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 710.61,
|
|
"tps_std": 4.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 161.22,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 881.45,
|
|
"tps_std": 3.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 213.5,
|
|
"tps_std": 0.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 735.98,
|
|
"tps_std": 5.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 205.29,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 166.51,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 72.65,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 259.71,
|
|
"tps_std": 1.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 302.29,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 263.95,
|
|
"tps_std": 1.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 305.52,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.59,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 260.98,
|
|
"tps_std": 1.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 324.69,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 262.3,
|
|
"tps_std": 1.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 324.11,
|
|
"tps_std": 0.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.45,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 228.5,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.43,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.76,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 236.84,
|
|
"tps_std": 1.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.04,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 290.04,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.76,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 140.84,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.97,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 106.21,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.21,
|
|
"tps_std": 0.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 190.66,
|
|
"tps_std": 7.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.41,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 191.12,
|
|
"tps_std": 0.46,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.85,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.62,
|
|
"tps_std": 1.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.93,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.41,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.32,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.8,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.97,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.63,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 197.89,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.96,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 70.32,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.22,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 198.04,
|
|
"tps_std": 1.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.11,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 70.27,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.02,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 197.46,
|
|
"tps_std": 1.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 48.93,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.34,
|
|
"tps_std": 0.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.0,
|
|
"tps_std": 1.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.33,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.46,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 106.76,
|
|
"tps_std": 0.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 26.54,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 158.81,
|
|
"tps_std": 2.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 28.25,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.49,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 474.42,
|
|
"tps_std": 2.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 189.58,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.53,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 479.78,
|
|
"tps_std": 2.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 180.26,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 556.96,
|
|
"tps_std": 2.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 238.1,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.26,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 556.8,
|
|
"tps_std": 4.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 237.85,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.46,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 503.77,
|
|
"tps_std": 3.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.59,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.25,
|
|
"tps_std": 1.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 482.99,
|
|
"tps_std": 0.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 175.78,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.39,
|
|
"tps_std": 0.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 73.62,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 369.06,
|
|
"tps_std": 2.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 140.81,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 994.33,
|
|
"tps_std": 11.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.87,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 209.15,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.88,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 994.22,
|
|
"tps_std": 10.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.84,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 208.93,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.9,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1009.37,
|
|
"tps_std": 9.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 53.13,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 285.49,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.53,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1012.69,
|
|
"tps_std": 9.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 54.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 285.25,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.5,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1023.24,
|
|
"tps_std": 11.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.92,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 206.37,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1012.11,
|
|
"tps_std": 7.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.92,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 205.56,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.62,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 828.53,
|
|
"tps_std": 4.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 63.31,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 110.5,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.87,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1145.66,
|
|
"tps_std": 9.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.15,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 193.03,
|
|
"tps_std": 0.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.02,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1149.31,
|
|
"tps_std": 13.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 67.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 212.38,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.49,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1149.83,
|
|
"tps_std": 7.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.05,
|
|
"tps_std": 0.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 212.45,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.52,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1170.01,
|
|
"tps_std": 7.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 65.12,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 291.28,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.65,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1167.76,
|
|
"tps_std": 7.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 64.97,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 290.12,
|
|
"tps_std": 2.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.65,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1178.27,
|
|
"tps_std": 10.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.46,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 209.14,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.83,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1172.23,
|
|
"tps_std": 12.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.65,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 209.05,
|
|
"tps_std": 0.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.76,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 882.98,
|
|
"tps_std": 3.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.84,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 111.65,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.03,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1290.5,
|
|
"tps_std": 7.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 83.79,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.26,
|
|
"tps_std": 0.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.04,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 613.58,
|
|
"tps_std": 2.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 447.94,
|
|
"tps_std": 2.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 583.48,
|
|
"tps_std": 105.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.85,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 439.93,
|
|
"tps_std": 32.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 627.46,
|
|
"tps_std": 3.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.02,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 527.78,
|
|
"tps_std": 1.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 623.64,
|
|
"tps_std": 17.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.16,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 512.14,
|
|
"tps_std": 3.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.33,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 622.47,
|
|
"tps_std": 8.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 443.0,
|
|
"tps_std": 30.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.97,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 600.08,
|
|
"tps_std": 13.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 457.86,
|
|
"tps_std": 1.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.08,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 396.36,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.9,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 208.44,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.08,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 500.88,
|
|
"tps_std": 3.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 420.42,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.05,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.94,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 629.03,
|
|
"tps_std": 5.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.37,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 439.65,
|
|
"tps_std": 0.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.25,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.58,
|
|
"tps_std": 5.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.86,
|
|
"tps_std": 0.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 457.6,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.22,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 634.72,
|
|
"tps_std": 6.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.9,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 511.83,
|
|
"tps_std": 7.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.45,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 632.78,
|
|
"tps_std": 59.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.53,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 507.17,
|
|
"tps_std": 2.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.44,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 621.13,
|
|
"tps_std": 82.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.52,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 467.56,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.26,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 661.07,
|
|
"tps_std": 5.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 432.86,
|
|
"tps_std": 0.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.2,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 436.5,
|
|
"tps_std": 7.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 34.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 218.02,
|
|
"tps_std": 0.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.5,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 587.86,
|
|
"tps_std": 37.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 36.28,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 453.76,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.67,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 86.68,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 305.11,
|
|
"tps_std": 1.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 246.59,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.49,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 313.18,
|
|
"tps_std": 2.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 243.74,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.51,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 311.68,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.77,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 273.72,
|
|
"tps_std": 1.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.91,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 306.06,
|
|
"tps_std": 2.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.25,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 270.84,
|
|
"tps_std": 0.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.98,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 314.27,
|
|
"tps_std": 4.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 235.12,
|
|
"tps_std": 5.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.36,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 310.73,
|
|
"tps_std": 1.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.61,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 241.56,
|
|
"tps_std": 5.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.35,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 183.05,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.85,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 239.56,
|
|
"tps_std": 7.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.68,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 203.34,
|
|
"tps_std": 0.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.09,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 508.43,
|
|
"tps_std": 3.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 423.84,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.64,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 512.17,
|
|
"tps_std": 3.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 382.51,
|
|
"tps_std": 1.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.63,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 544.11,
|
|
"tps_std": 3.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.4,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 407.19,
|
|
"tps_std": 1.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.59,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 550.28,
|
|
"tps_std": 3.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.23,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 405.13,
|
|
"tps_std": 1.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 541.57,
|
|
"tps_std": 11.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 441.64,
|
|
"tps_std": 9.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 22.18,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 509.57,
|
|
"tps_std": 8.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 379.36,
|
|
"tps_std": 1.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 22.2,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 122.56,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 11.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 97.32,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 309.96,
|
|
"tps_std": 4.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.79,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 258.85,
|
|
"tps_std": 0.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.39,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1071.38,
|
|
"tps_std": 11.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 669.09,
|
|
"tps_std": 1.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.19,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1093.96,
|
|
"tps_std": 6.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.95,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 661.4,
|
|
"tps_std": 0.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.13,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1079.44,
|
|
"tps_std": 6.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.46,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 762.29,
|
|
"tps_std": 2.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.46,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1082.35,
|
|
"tps_std": 6.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.48,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 777.89,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.24,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1092.86,
|
|
"tps_std": 9.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 48.16,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 655.39,
|
|
"tps_std": 2.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 41.9,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1113.86,
|
|
"tps_std": 6.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 48.1,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 655.89,
|
|
"tps_std": 1.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 41.98,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 661.63,
|
|
"tps_std": 3.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.16,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 288.86,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 44.24,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1013.4,
|
|
"tps_std": 39.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 59.13,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 673.55,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 48.93,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 854.2,
|
|
"tps_std": 6.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 392.45,
|
|
"tps_std": 16.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 877.69,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 387.73,
|
|
"tps_std": 18.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 869.53,
|
|
"tps_std": 1.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 260.25,
|
|
"tps_std": 4.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 870.35,
|
|
"tps_std": 1.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 263.85,
|
|
"tps_std": 5.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 892.78,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 441.92,
|
|
"tps_std": 38.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 895.09,
|
|
"tps_std": 0.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 449.4,
|
|
"tps_std": 28.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 122.72,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.31,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 107.34,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 513.78,
|
|
"tps_std": 16.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.07,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 258.63,
|
|
"tps_std": 1.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 324.28,
|
|
"tps_std": 1.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.64,
|
|
"tps_std": 2.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 455.07,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.26,
|
|
"tps_std": 1.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 426.08,
|
|
"tps_std": 0.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 209.69,
|
|
"tps_std": 3.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.68,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 440.33,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.85,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 466.09,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.83,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.68,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 452.21,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 181.81,
|
|
"tps_std": 3.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 91.65,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 81.52,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2700.94,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 77.69,
|
|
"tps_std": 0.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1564.27,
|
|
"tps_std": 18.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.8,
|
|
"tps_std": 0.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2691.0,
|
|
"tps_std": 4.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 77.86,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1563.05,
|
|
"tps_std": 19.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.95,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2719.77,
|
|
"tps_std": 6.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.32,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1687.79,
|
|
"tps_std": 33.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.09,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2713.06,
|
|
"tps_std": 9.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.85,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1681.29,
|
|
"tps_std": 17.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.11,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2666.49,
|
|
"tps_std": 3.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.31,
|
|
"tps_std": 0.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1530.18,
|
|
"tps_std": 18.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.72,
|
|
"tps_std": 0.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2674.53,
|
|
"tps_std": 5.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.93,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1534.58,
|
|
"tps_std": 20.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.65,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 647.4,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 79.07,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 455.63,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.86,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2479.97,
|
|
"tps_std": 41.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 87.24,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1759.67,
|
|
"tps_std": 6.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 64.91,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 631.59,
|
|
"tps_std": 4.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.91,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 303.63,
|
|
"tps_std": 0.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.07,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 610.41,
|
|
"tps_std": 53.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 302.82,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.12,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.44,
|
|
"tps_std": 6.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 49.85,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 442.64,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.69,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 639.43,
|
|
"tps_std": 31.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.99,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 438.75,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.75,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 596.69,
|
|
"tps_std": 97.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 308.13,
|
|
"tps_std": 1.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.43,
|
|
"tps_std": 8.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 641.07,
|
|
"tps_std": 11.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 314.5,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.04,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.81,
|
|
"tps_std": 2.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.18,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 213.74,
|
|
"tps_std": 0.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.52,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 633.21,
|
|
"tps_std": 13.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.15,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 287.49,
|
|
"tps_std": 1.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 42.67,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1638.53,
|
|
"tps_std": 13.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.67,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 488.89,
|
|
"tps_std": 0.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.91,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1631.29,
|
|
"tps_std": 15.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.62,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 492.09,
|
|
"tps_std": 1.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.93,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1691.01,
|
|
"tps_std": 16.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.07,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 730.11,
|
|
"tps_std": 1.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.02,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1690.3,
|
|
"tps_std": 13.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.0,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 730.49,
|
|
"tps_std": 1.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.89,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1668.5,
|
|
"tps_std": 13.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.68,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 507.77,
|
|
"tps_std": 2.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.46,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1642.7,
|
|
"tps_std": 14.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.75,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 507.84,
|
|
"tps_std": 1.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.32,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1303.99,
|
|
"tps_std": 6.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.68,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 364.73,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 49.99,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1577.96,
|
|
"tps_std": 12.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 541.12,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 60.77,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1543.27,
|
|
"tps_std": 2.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.61,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 165.68,
|
|
"tps_std": 0.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1539.48,
|
|
"tps_std": 5.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.57,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.31,
|
|
"tps_std": 1.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1528.37,
|
|
"tps_std": 6.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.14,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 196.35,
|
|
"tps_std": 2.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1521.12,
|
|
"tps_std": 5.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.22,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 196.03,
|
|
"tps_std": 1.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1507.68,
|
|
"tps_std": 1.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.41,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 206.97,
|
|
"tps_std": 1.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1508.58,
|
|
"tps_std": 2.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.44,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 206.54,
|
|
"tps_std": 0.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 324.82,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.43,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 144.29,
|
|
"tps_std": 1.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.2,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1313.97,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.59,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 208.18,
|
|
"tps_std": 2.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.52,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2405d59cb",
|
|
"number": "8577"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 97.96,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 73.57,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 4.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 99.24,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 4.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 99.22,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 99.58,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.73,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 58.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 158.25,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 59.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 159.79,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 64.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 169.3,
|
|
"tps_std": 0.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.93,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 65.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 169.5,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 60.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.03,
|
|
"tps_std": 0.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.98,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 60.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.91,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": null,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "e0c93af2a",
|
|
"number": "7938"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
}
|
|
]
|
|
} |