15226 lines
411 KiB
JSON
15226 lines
411 KiB
JSON
{
|
|
"meta": {
|
|
"generated_at": "2026-01-12T09:25:21Z",
|
|
"system_info": {
|
|
"distro": "Fedora Linux 42 (Workstation Edition)",
|
|
"kernel": "6.18.3-100.fc42.x86_64",
|
|
"linux_firmware": "linux-firmware-20251111-1.fc42.noarch",
|
|
"timestamp": "09 Jan 2026"
|
|
},
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm6_4_4",
|
|
"rocm6_4_4-hblt0",
|
|
"rocm7-nightlies",
|
|
"rocm7-nightlies-hblt0",
|
|
"rocm7.1.1",
|
|
"rocm7.1.1-hblt0",
|
|
"rocm7_rc",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 81.03,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 79.43,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.8,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 73.64,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.74,
|
|
"tps_std": 0.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.94,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 77.29,
|
|
"tps_std": 5.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.83,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 76.84,
|
|
"tps_std": 4.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.84,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 41.19,
|
|
"tps_std": 7.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 1.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 47.53,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.96,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 279.35,
|
|
"tps_std": 0.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 37.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 307.88,
|
|
"tps_std": 1.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 190.14,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 36.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 235.84,
|
|
"tps_std": 0.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 279.68,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 37.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 305.29,
|
|
"tps_std": 1.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.83,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 320.89,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 23.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 281.21,
|
|
"tps_std": 0.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 151.37,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 31.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.36,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 36.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 88.58,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 30.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 152.92,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 35.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.64,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 188.13,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 36.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 290.49,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 261.76,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.93,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 148.26,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 147.21,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 67.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 26.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 66.64,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 26.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 148.44,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.61,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 100.89,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 87.66,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 21.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 801.73,
|
|
"tps_std": 2.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 163.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 805.52,
|
|
"tps_std": 3.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 164.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 798.6,
|
|
"tps_std": 3.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 153.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 799.84,
|
|
"tps_std": 4.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 159.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 792.78,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 156.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 803.71,
|
|
"tps_std": 3.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 163.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 187.83,
|
|
"tps_std": 22.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 64.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.84,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 75.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1065.39,
|
|
"tps_std": 1.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.12,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 823.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1034.18,
|
|
"tps_std": 3.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 896.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 567.35,
|
|
"tps_std": 4.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 660.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 560.67,
|
|
"tps_std": 3.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 663.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1051.12,
|
|
"tps_std": 10.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 704.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1028.01,
|
|
"tps_std": 11.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 743.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1253.52,
|
|
"tps_std": 10.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 408.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1016.39,
|
|
"tps_std": 35.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.53,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 403.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 206.6,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 47.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 197.06,
|
|
"tps_std": 14.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 47.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 202.07,
|
|
"tps_std": 3.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 188.66,
|
|
"tps_std": 20.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.61,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 187.93,
|
|
"tps_std": 19.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.7,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 17.92,
|
|
"tps_std": 2.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.99,
|
|
"tps_std": 0.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 57.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 168.14,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.89,
|
|
"tps_std": 0.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.12,
|
|
"tps_std": 2.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 254.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 585.67,
|
|
"tps_std": 2.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 244.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 492.51,
|
|
"tps_std": 1.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 203.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 494.46,
|
|
"tps_std": 2.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 173.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 469.57,
|
|
"tps_std": 3.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 173.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 471.12,
|
|
"tps_std": 8.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 172.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 424.44,
|
|
"tps_std": 1.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 65.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 364.62,
|
|
"tps_std": 2.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 93.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1073.1,
|
|
"tps_std": 11.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.78,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 206.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1075.09,
|
|
"tps_std": 15.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 904.96,
|
|
"tps_std": 12.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 158.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 906.79,
|
|
"tps_std": 8.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 158.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 999.37,
|
|
"tps_std": 14.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1004.04,
|
|
"tps_std": 12.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.32,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 168.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1180.84,
|
|
"tps_std": 8.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 66.24,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 71.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1046.73,
|
|
"tps_std": 6.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.71,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1240.19,
|
|
"tps_std": 1.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.06,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 286.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1246.06,
|
|
"tps_std": 12.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.95,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 211.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1225.75,
|
|
"tps_std": 5.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.54,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 163.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1228.38,
|
|
"tps_std": 14.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.53,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 165.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1224.8,
|
|
"tps_std": 12.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.07,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 171.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1228.44,
|
|
"tps_std": 13.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.99,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 172.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1072.21,
|
|
"tps_std": 149.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 1.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 71.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1075.31,
|
|
"tps_std": 42.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 86.69,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 111.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 587.41,
|
|
"tps_std": 3.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 421.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 610.91,
|
|
"tps_std": 4.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.22,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 432.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 354.31,
|
|
"tps_std": 5.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.4,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 327.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 364.74,
|
|
"tps_std": 5.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 340.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 586.56,
|
|
"tps_std": 7.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.8,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 403.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 609.81,
|
|
"tps_std": 7.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.84,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 411.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 634.07,
|
|
"tps_std": 4.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.94,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 121.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 22.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 538.47,
|
|
"tps_std": 29.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 31.56,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 211.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 931.79,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 247.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 936.67,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 259.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 428.84,
|
|
"tps_std": 1.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 275.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 431.06,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 283.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 926.89,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 262.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 934.3,
|
|
"tps_std": 0.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 254.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 602.68,
|
|
"tps_std": 80.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 21.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 548.18,
|
|
"tps_std": 1.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 231.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 472.15,
|
|
"tps_std": 0.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 531.41,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 214.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 470.21,
|
|
"tps_std": 1.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 179.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 526.32,
|
|
"tps_std": 1.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 193.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 467.63,
|
|
"tps_std": 1.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 527.37,
|
|
"tps_std": 1.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 111.81,
|
|
"tps_std": 20.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 73.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 107.4,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 64.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2884.56,
|
|
"tps_std": 5.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.8,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1446.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2874.72,
|
|
"tps_std": 3.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.97,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1258.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2829.05,
|
|
"tps_std": 14.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 82.17,
|
|
"tps_std": 4.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1118.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 61.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2843.1,
|
|
"tps_std": 21.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1123.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 61.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2657.05,
|
|
"tps_std": 331.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 62.0,
|
|
"tps_std": 3.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1124.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2818.77,
|
|
"tps_std": 65.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 65.67,
|
|
"tps_std": 4.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1136.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1514.96,
|
|
"tps_std": 340.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.61,
|
|
"tps_std": 2.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 66.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1235.5,
|
|
"tps_std": 244.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.02,
|
|
"tps_std": 2.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 694.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 49.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 683.09,
|
|
"tps_std": 7.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 334.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 684.21,
|
|
"tps_std": 8.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 333.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 283.71,
|
|
"tps_std": 2.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 207.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 284.3,
|
|
"tps_std": 2.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 198.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 675.95,
|
|
"tps_std": 6.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 257.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 667.48,
|
|
"tps_std": 9.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 255.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 862.37,
|
|
"tps_std": 1.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 5.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 183.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 585.93,
|
|
"tps_std": 27.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.18,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1776.02,
|
|
"tps_std": 15.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.43,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 596.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1777.68,
|
|
"tps_std": 17.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.45,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 546.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 816.54,
|
|
"tps_std": 1.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 374.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 821.55,
|
|
"tps_std": 13.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 355.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 52.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1710.76,
|
|
"tps_std": 45.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 420.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 55.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1732.05,
|
|
"tps_std": 23.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 417.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 55.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1771.72,
|
|
"tps_std": 240.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 294.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1429.1,
|
|
"tps_std": 24.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.56,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1595.85,
|
|
"tps_std": 4.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.05,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1599.42,
|
|
"tps_std": 4.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 187.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 671.91,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 147.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 671.59,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.64,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies-hblt0",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1578.33,
|
|
"tps_std": 5.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.91,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 165.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1587.41,
|
|
"tps_std": 1.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.89,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 165.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1261.9,
|
|
"tps_std": 215.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 104.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1126.16,
|
|
"tps_std": 2.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.42,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 162.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "9c142e3a2",
|
|
"number": "7670"
|
|
}
|
|
}
|
|
]
|
|
} |