Added Qwen-3-Next benchmarks
This commit is contained in:
+951
-1
@@ -1,6 +1,6 @@
|
||||
{
|
||||
"meta": {
|
||||
"generated_at": "2025-11-19T07:33:18Z",
|
||||
"generated_at": "2025-11-28T15:55:43Z",
|
||||
"os_kernel": "Fedora 42 \u2014 Linux 6.15.9-201.fc42.x86_64 (Sat Aug 2 11:37:34 UTC 2025)",
|
||||
"llamacpp_builds": [
|
||||
{
|
||||
@@ -47,6 +47,10 @@
|
||||
"hash": "bca95ca51",
|
||||
"number": "7036"
|
||||
},
|
||||
{
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
},
|
||||
{
|
||||
"hash": "caca0d55c",
|
||||
"number": "7085"
|
||||
@@ -22776,6 +22780,952 @@
|
||||
"number": "7089"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-rocwmma",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 245.79,
|
||||
"tps_std": 0.39,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-rocwmma",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 19.3,
|
||||
"tps_std": 0.09,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-rocwmma-hblt0",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 301.76,
|
||||
"tps_std": 0.36,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-rocwmma-hblt0",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.98,
|
||||
"tps_std": 0.02,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 249.8,
|
||||
"tps_std": 4.99,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 19.17,
|
||||
"tps_std": 0.01,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-hblt0",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 305.05,
|
||||
"tps_std": 2.25,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm-7alpha-hblt0",
|
||||
"env_base": "rocm",
|
||||
"env_variant": "7alpha-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.99,
|
||||
"tps_std": 0.16,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4-rocwmma",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 311.74,
|
||||
"tps_std": 3.86,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4-rocwmma",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 22.66,
|
||||
"tps_std": 0.25,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4-rocwmma-hblt0",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 313.2,
|
||||
"tps_std": 3.93,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4-rocwmma-hblt0",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.02,
|
||||
"tps_std": 0.3,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 320.42,
|
||||
"tps_std": 0.35,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.06,
|
||||
"tps_std": 0.13,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm6_4_4-hblt0",
|
||||
"env_base": "rocm6_4_4",
|
||||
"env_variant": "hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": null,
|
||||
"tps_mean": null,
|
||||
"tps_std": null,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": null,
|
||||
"ngl": null,
|
||||
"mmap": null,
|
||||
"params_b": null,
|
||||
"file_size_gib": null,
|
||||
"name_params_b": 80.0,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": null
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-rocwmma",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 258.3,
|
||||
"tps_std": 2.66,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-rocwmma",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 18.49,
|
||||
"tps_std": 0.24,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-rocwmma-hblt0",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 322.7,
|
||||
"tps_std": 2.1,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-rocwmma-hblt0",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.45,
|
||||
"tps_std": 0.19,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 253.35,
|
||||
"tps_std": 2.88,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 18.25,
|
||||
"tps_std": 0.15,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-hblt0",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 319.09,
|
||||
"tps_std": 2.77,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7.1-hblt0",
|
||||
"env_base": "rocm7.1",
|
||||
"env_variant": "hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.72,
|
||||
"tps_std": 0.03,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-rocwmma",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 254.34,
|
||||
"tps_std": 2.6,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-rocwmma",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "rocwmma",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 18.06,
|
||||
"tps_std": 0.08,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-rocwmma-hblt0",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 323.33,
|
||||
"tps_std": 1.75,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-rocwmma-hblt0",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "rocwmma-hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.37,
|
||||
"tps_std": 0.17,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 242.43,
|
||||
"tps_std": 0.28,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 18.35,
|
||||
"tps_std": 0.1,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-hblt0",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 305.22,
|
||||
"tps_std": 3.1,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "rocm7_rc-hblt0",
|
||||
"env_base": "rocm7_rc",
|
||||
"env_variant": "hblt0",
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 23.6,
|
||||
"tps_std": 0.08,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "ROCm",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "vulkan_amdvlk",
|
||||
"env_base": "vulkan_amdvlk",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": null,
|
||||
"tps_mean": null,
|
||||
"tps_std": null,
|
||||
"error": true,
|
||||
"error_type": "load",
|
||||
"backend": null,
|
||||
"ngl": null,
|
||||
"mmap": null,
|
||||
"params_b": null,
|
||||
"file_size_gib": null,
|
||||
"name_params_b": 80.0,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
||||
"rpc": false,
|
||||
"build": null
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "vulkan_radv",
|
||||
"env_base": "vulkan_radv",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "pp512",
|
||||
"tps_mean": 324.45,
|
||||
"tps_std": 0.42,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "Vulkan",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
||||
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
||||
"env": "vulkan_radv",
|
||||
"env_base": "vulkan_radv",
|
||||
"env_variant": null,
|
||||
"fa": true,
|
||||
"context": "default",
|
||||
"context_tokens": null,
|
||||
"test": "tg128",
|
||||
"tps_mean": 22.31,
|
||||
"tps_std": 0.18,
|
||||
"error": false,
|
||||
"error_type": null,
|
||||
"backend": "Vulkan",
|
||||
"ngl": 99,
|
||||
"mmap": 0,
|
||||
"params_b": 79.67,
|
||||
"file_size_gib": 79.57,
|
||||
"name_params_b": 79.67,
|
||||
"quant": "Q8_K_XL",
|
||||
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
||||
"rpc": false,
|
||||
"build": {
|
||||
"hash": "c6f7a423c",
|
||||
"number": "7189"
|
||||
}
|
||||
},
|
||||
{
|
||||
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
||||
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
||||
|
||||
Reference in New Issue
Block a user