45534 lines
1.2 MiB
Plaintext
45534 lines
1.2 MiB
Plaintext
{
|
|
"meta": {
|
|
"generated_at": "2025-12-05T08:29:05Z",
|
|
"os_kernel": "Fedora 42 \u2014 Linux 6.15.9-201.fc42.x86_64 (Sat Aug 2 11:37:34 UTC 2025)",
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
},
|
|
{
|
|
"hash": "0a3857fe0",
|
|
"number": "7089"
|
|
},
|
|
{
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
},
|
|
{
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
},
|
|
{
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
},
|
|
{
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "ab5783eb4",
|
|
"number": "7089"
|
|
},
|
|
{
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
},
|
|
{
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
},
|
|
{
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm-7alpha",
|
|
"rocm-7alpha-hblt0",
|
|
"rocm-7alpha-rocwmma",
|
|
"rocm-7alpha-rocwmma-hblt0",
|
|
"rocm-7alpha-rocwmma-improved",
|
|
"rocm-7alpha-rocwmma-improved-hblt0",
|
|
"rocm6_4_4",
|
|
"rocm6_4_4-hblt0",
|
|
"rocm6_4_4-rocwmma",
|
|
"rocm6_4_4-rocwmma-hblt0",
|
|
"rocm7.1",
|
|
"rocm7.1-hblt0",
|
|
"rocm7.1-rocwmma",
|
|
"rocm7.1-rocwmma-hblt0",
|
|
"rocm7_rc",
|
|
"rocm7_rc-hblt0",
|
|
"rocm7_rc-rocwmma",
|
|
"rocm7_rc-rocwmma-hblt0",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.27,
|
|
"tps_std": 0.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 19.09,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 167.68,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.85,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 87.62,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 13.99,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 170.65,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 14.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 93.53,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.42,
|
|
"tps_std": 0.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 135.1,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.41,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.39,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.7,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 13.3,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 135.5,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 30.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.61,
|
|
"tps_std": 0.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.91,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 77.55,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.62,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.5,
|
|
"tps_std": 0.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.23,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 99.42,
|
|
"tps_std": 0.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.08,
|
|
"tps_std": 0.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.38,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.4,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 131.85,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.71,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.15,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 99.25,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.54,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 169.93,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 217.91,
|
|
"tps_std": 0.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.5,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 235.07,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.84,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 92.38,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 19.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 147.75,
|
|
"tps_std": 0.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 86.5,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 14.06,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 140.67,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 14.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 74.73,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 26.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 151.03,
|
|
"tps_std": 0.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 125.43,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.48,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 140.41,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.52,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 13.2,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 130.63,
|
|
"tps_std": 0.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 26.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.79,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.57,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.65,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 69.31,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.5,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.07,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 136.65,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.46,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.05,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 94.32,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.25,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 130.72,
|
|
"tps_std": 0.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.54,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 114.56,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 159.14,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.44,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.46,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 96.45,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 130.86,
|
|
"tps_std": 0.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.53,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 36.62,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 261.54,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 23.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 233.87,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.85,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 19.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 101.51,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 19.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.65,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.07,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.71,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 105.64,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 33.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 102.84,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 102.56,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 11.74,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.23,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 11.69,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 105.28,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 70.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 104.32,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 102.8,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 15.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 102.92,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 15.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.28,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 104.3,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 35.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 103.21,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 15.05,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 96.88,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 15.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 104.95,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 97.99,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 70.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 98.55,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 86.56,
|
|
"tps_std": 0.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 263.94,
|
|
"tps_std": 2.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 155.11,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 152.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 273.53,
|
|
"tps_std": 2.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.17,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 274.07,
|
|
"tps_std": 3.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.44,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 273.71,
|
|
"tps_std": 1.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.24,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 289.25,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.12,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.11,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 290.6,
|
|
"tps_std": 0.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.38,
|
|
"tps_std": 1.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 293.23,
|
|
"tps_std": 0.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 128.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 287.19,
|
|
"tps_std": 1.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.25,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.62,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 294.05,
|
|
"tps_std": 2.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.17,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.59,
|
|
"tps_std": 1.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 126.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 287.84,
|
|
"tps_std": 2.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 127.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.02,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 207.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 282.7,
|
|
"tps_std": 0.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 224.36,
|
|
"tps_std": 2.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 84.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 211.78,
|
|
"tps_std": 1.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 85.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q6_K",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 82.35,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q6_K",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q6_K-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 272.42,
|
|
"tps_std": 2.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 149.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 271.67,
|
|
"tps_std": 1.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.13,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 153.04,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 273.57,
|
|
"tps_std": 2.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 108.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 269.91,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.11,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 107.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 274.27,
|
|
"tps_std": 3.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 190.45,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 296.39,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.8,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 295.81,
|
|
"tps_std": 2.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.06,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 295.53,
|
|
"tps_std": 3.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 208.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 298.3,
|
|
"tps_std": 1.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 295.26,
|
|
"tps_std": 1.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 124.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.62,
|
|
"tps_std": 1.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 124.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 296.33,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 296.32,
|
|
"tps_std": 1.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 291.43,
|
|
"tps_std": 1.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 127.05,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 287.94,
|
|
"tps_std": 1.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 127.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 268.04,
|
|
"tps_std": 46.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 287.0,
|
|
"tps_std": 2.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 349.58,
|
|
"tps_std": 2.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 280.28,
|
|
"tps_std": 1.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 12.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 106.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-Q8_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 106.65,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q8_0",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-Q8_0-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 313.68,
|
|
"tps_std": 2.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 154.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 312.46,
|
|
"tps_std": 3.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 311.89,
|
|
"tps_std": 2.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 313.81,
|
|
"tps_std": 0.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 314.61,
|
|
"tps_std": 2.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 315.62,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 308.87,
|
|
"tps_std": 1.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.54,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 101.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 306.69,
|
|
"tps_std": 2.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 308.5,
|
|
"tps_std": 4.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 209.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 308.24,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 217.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 304.34,
|
|
"tps_std": 2.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.61,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 138.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 305.86,
|
|
"tps_std": 2.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.55,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 134.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 306.39,
|
|
"tps_std": 1.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 198.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 309.0,
|
|
"tps_std": 2.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 305.09,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 136.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 292.67,
|
|
"tps_std": 0.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.6,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 302.22,
|
|
"tps_std": 1.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 196.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 300.96,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 17.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.52,
|
|
"tps_std": 1.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 20.65,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 81.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 230.79,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 20.79,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 89.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 107.77,
|
|
"file_size_gib": 57.73,
|
|
"name_params_b": 107.77,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Llama-4-Scout-17B-16E-Instruct-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 141.46,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 48.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 140.4,
|
|
"tps_std": 0.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.93,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.18,
|
|
"tps_std": 0.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 28.32,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.52,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.13,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.46,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.03,
|
|
"tps_std": 1.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 140.69,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.07,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 38.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.65,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 24.32,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.82,
|
|
"tps_std": 1.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.11,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 24.0,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.45,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 47.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.3,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 48.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.51,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 27.99,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.56,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 27.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.23,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 39.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.0,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 40.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.65,
|
|
"tps_std": 0.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 27.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.7,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 28.48,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.17,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 39.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.77,
|
|
"tps_std": 0.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 139.19,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.45,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 128.55,
|
|
"tps_std": 1.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.47,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 478.1,
|
|
"tps_std": 4.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 197.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 352.23,
|
|
"tps_std": 9.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 192.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 483.01,
|
|
"tps_std": 4.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 147.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 345.22,
|
|
"tps_std": 23.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.84,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 135.26,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 482.27,
|
|
"tps_std": 5.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 164.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.93,
|
|
"tps_std": 3.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 197.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 479.75,
|
|
"tps_std": 5.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 107.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.25,
|
|
"tps_std": 7.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.84,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 107.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 493.29,
|
|
"tps_std": 1.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 208.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 362.53,
|
|
"tps_std": 2.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 244.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 484.23,
|
|
"tps_std": 1.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 357.45,
|
|
"tps_std": 1.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 127.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 485.6,
|
|
"tps_std": 4.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.98,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 174.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.51,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 174.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 472.32,
|
|
"tps_std": 1.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.13,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 129.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 348.39,
|
|
"tps_std": 4.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 125.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 12.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 487.44,
|
|
"tps_std": 3.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 350.49,
|
|
"tps_std": 4.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 174.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 191.31,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 53.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 165.85,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.35,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 73.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 573.35,
|
|
"tps_std": 5.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 579.57,
|
|
"tps_std": 12.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 568.92,
|
|
"tps_std": 3.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.4,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 147.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 575.31,
|
|
"tps_std": 5.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.66,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 574.31,
|
|
"tps_std": 5.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.33,
|
|
"tps_std": 7.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 622.81,
|
|
"tps_std": 3.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.81,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 625.44,
|
|
"tps_std": 4.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 108.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 640.29,
|
|
"tps_std": 6.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.58,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 203.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 632.09,
|
|
"tps_std": 4.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 620.61,
|
|
"tps_std": 2.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.85,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 617.37,
|
|
"tps_std": 6.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.82,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 628.16,
|
|
"tps_std": 1.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.33,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 167.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 628.24,
|
|
"tps_std": 3.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.33,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 169.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 625.38,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.11,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 616.46,
|
|
"tps_std": 1.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 625.22,
|
|
"tps_std": 5.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 168.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 626.37,
|
|
"tps_std": 6.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 170.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1013.46,
|
|
"tps_std": 4.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 62.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 69.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 853.23,
|
|
"tps_std": 3.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 66.93,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 104.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 29.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 673.5,
|
|
"tps_std": 8.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 70.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 669.29,
|
|
"tps_std": 4.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 674.15,
|
|
"tps_std": 10.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.14,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 150.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 666.63,
|
|
"tps_std": 5.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.62,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 148.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 675.1,
|
|
"tps_std": 3.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 161.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 676.38,
|
|
"tps_std": 1.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.44,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 663.26,
|
|
"tps_std": 2.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.79,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 108.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 655.75,
|
|
"tps_std": 5.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.7,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 109.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 674.37,
|
|
"tps_std": 11.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 67.62,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 665.28,
|
|
"tps_std": 7.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.57,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 649.91,
|
|
"tps_std": 5.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.03,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 658.06,
|
|
"tps_std": 8.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.11,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 662.81,
|
|
"tps_std": 8.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.77,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 167.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 660.13,
|
|
"tps_std": 8.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.73,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 169.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 650.55,
|
|
"tps_std": 3.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 647.31,
|
|
"tps_std": 2.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.01,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 660.75,
|
|
"tps_std": 2.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 662.51,
|
|
"tps_std": 3.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 170.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 774.61,
|
|
"tps_std": 2.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.31,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 68.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 832.44,
|
|
"tps_std": 3.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 87.24,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 602.73,
|
|
"tps_std": 3.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.21,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 201.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 587.21,
|
|
"tps_std": 4.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 200.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 601.39,
|
|
"tps_std": 7.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.54,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 585.7,
|
|
"tps_std": 2.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.59,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 148.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 601.34,
|
|
"tps_std": 1.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 160.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 585.58,
|
|
"tps_std": 4.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 163.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 652.89,
|
|
"tps_std": 1.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 110.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 638.38,
|
|
"tps_std": 7.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 108.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.39,
|
|
"tps_std": 23.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.52,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 218.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 640.53,
|
|
"tps_std": 6.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.87,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 207.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 650.26,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.8,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 132.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 634.84,
|
|
"tps_std": 9.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 649.99,
|
|
"tps_std": 3.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 640.61,
|
|
"tps_std": 7.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 171.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.21,
|
|
"tps_std": 4.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.85,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 631.07,
|
|
"tps_std": 4.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.89,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 131.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 654.79,
|
|
"tps_std": 1.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.22,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 237.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 633.61,
|
|
"tps_std": 5.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 44.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 221.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1152.51,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ab5783eb4",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.58,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ab5783eb4",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 71.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ab5783eb4",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ab5783eb4",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 916.61,
|
|
"tps_std": 3.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "0a3857fe0",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.81,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "0a3857fe0",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 108.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "0a3857fe0",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 33.51,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "0a3857fe0",
|
|
"number": "7089"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 248.51,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.33,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 302.76,
|
|
"tps_std": 0.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.42,
|
|
"tps_std": 0.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 242.26,
|
|
"tps_std": 2.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.98,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 287.99,
|
|
"tps_std": 2.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.05,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 318.5,
|
|
"tps_std": 0.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.75,
|
|
"tps_std": 0.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 325.56,
|
|
"tps_std": 2.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.95,
|
|
"tps_std": 0.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 320.64,
|
|
"tps_std": 0.8,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.55,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 325.06,
|
|
"tps_std": 1.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.14,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 264.35,
|
|
"tps_std": 7.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.89,
|
|
"tps_std": 0.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 321.93,
|
|
"tps_std": 4.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.64,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 256.63,
|
|
"tps_std": 1.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.18,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 324.95,
|
|
"tps_std": 0.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.54,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 255.48,
|
|
"tps_std": 2.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.31,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 327.95,
|
|
"tps_std": 1.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.64,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 264.12,
|
|
"tps_std": 2.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.94,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 328.73,
|
|
"tps_std": 4.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.46,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 417.28,
|
|
"tps_std": 0.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.31,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 333.74,
|
|
"tps_std": 1.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.76,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "03d9a77b8",
|
|
"number": "7278"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 751.05,
|
|
"tps_std": 61.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 323.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 799.75,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 335.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 795.35,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 354.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 804.75,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 369.35,
|
|
"tps_std": 42.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 816.42,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 345.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 826.54,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 371.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 811.49,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 151.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 819.41,
|
|
"tps_std": 1.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 149.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 826.24,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 267.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 833.1,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 252.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 797.32,
|
|
"tps_std": 10.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 180.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 810.77,
|
|
"tps_std": 1.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 819.82,
|
|
"tps_std": 2.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 269.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 832.48,
|
|
"tps_std": 2.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 266.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 802.23,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 167.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 790.38,
|
|
"tps_std": 0.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 170.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 813.63,
|
|
"tps_std": 8.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 265.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 813.23,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 252.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 590.41,
|
|
"tps_std": 71.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 11.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 533.84,
|
|
"tps_std": 0.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 219.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 439.12,
|
|
"tps_std": 31.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 112.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 513.7,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 115.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 428.59,
|
|
"tps_std": 48.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 93.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 527.23,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 95.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 409.77,
|
|
"tps_std": 60.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 192.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 528.54,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 199.09,
|
|
"tps_std": 3.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 469.22,
|
|
"tps_std": 0.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 92.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 524.21,
|
|
"tps_std": 1.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 93.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 472.47,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 530.73,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 204.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 463.62,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 113.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 522.69,
|
|
"tps_std": 0.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 115.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 434.79,
|
|
"tps_std": 46.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 179.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 524.39,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 195.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 463.45,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 111.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 499.44,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 115.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 470.06,
|
|
"tps_std": 0.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 177.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 501.79,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 198.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 106.82,
|
|
"tps_std": 1.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 62.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2224.91,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 75.58,
|
|
"tps_std": 9.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1239.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2106.39,
|
|
"tps_std": 2.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.35,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1185.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2245.25,
|
|
"tps_std": 4.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 75.82,
|
|
"tps_std": 8.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1224.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2111.57,
|
|
"tps_std": 5.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1190.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2256.38,
|
|
"tps_std": 8.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1206.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2154.09,
|
|
"tps_std": 4.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1291.24,
|
|
"tps_std": 6.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 59.61,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2283.48,
|
|
"tps_std": 2.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.74,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 898.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2154.45,
|
|
"tps_std": 10.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 76.62,
|
|
"tps_std": 3.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 855.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2276.8,
|
|
"tps_std": 11.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 82.07,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1497.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2161.24,
|
|
"tps_std": 6.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 82.35,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1440.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2269.02,
|
|
"tps_std": 4.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 59.93,
|
|
"tps_std": 6.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1031.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2141.35,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 64.63,
|
|
"tps_std": 11.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1002.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2261.65,
|
|
"tps_std": 12.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 62.69,
|
|
"tps_std": 7.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1160.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2171.0,
|
|
"tps_std": 3.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 65.68,
|
|
"tps_std": 10.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1240.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2257.61,
|
|
"tps_std": 5.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.84,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1046.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2102.34,
|
|
"tps_std": 8.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 67.4,
|
|
"tps_std": 10.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1033.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2275.52,
|
|
"tps_std": 10.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.45,
|
|
"tps_std": 10.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1168.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2114.7,
|
|
"tps_std": 2.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.07,
|
|
"tps_std": 12.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 1227.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 58.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1229.75,
|
|
"tps_std": 236.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 75.94,
|
|
"tps_std": 2.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 64.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1116.46,
|
|
"tps_std": 204.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.27,
|
|
"tps_std": 2.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 646.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 45.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 669.82,
|
|
"tps_std": 4.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.4,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 325.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 673.38,
|
|
"tps_std": 9.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 332.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 656.31,
|
|
"tps_std": 30.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 223.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 680.04,
|
|
"tps_std": 3.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 224.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 667.33,
|
|
"tps_std": 4.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 262.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 674.51,
|
|
"tps_std": 4.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 335.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 778.24,
|
|
"tps_std": 5.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.19,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 301.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 783.56,
|
|
"tps_std": 11.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.18,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 276.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 16.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 779.12,
|
|
"tps_std": 1.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 36.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 335.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 774.77,
|
|
"tps_std": 13.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 454.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 30.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 769.93,
|
|
"tps_std": 0.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.36,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 223.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 771.12,
|
|
"tps_std": 3.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 226.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 757.6,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 270.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 29.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 763.2,
|
|
"tps_std": 10.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 283.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 29.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 775.86,
|
|
"tps_std": 2.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.4,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 225.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 776.83,
|
|
"tps_std": 4.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 223.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 750.63,
|
|
"tps_std": 5.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 281.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 29.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 756.08,
|
|
"tps_std": 9.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 37.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 29.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 720.94,
|
|
"tps_std": 1.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 35.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 513.71,
|
|
"tps_std": 2.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 34.86,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 157.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-F16",
|
|
"model_clean": "gpt-oss-120b-F16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 60.87,
|
|
"name_params_b": 116.83,
|
|
"quant": "F16",
|
|
"log": "results/gpt-oss-120b-F16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 673.11,
|
|
"tps_std": 6.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 331.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 675.94,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 326.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 27.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 665.6,
|
|
"tps_std": 9.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 224.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 639.77,
|
|
"tps_std": 57.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 224.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 652.18,
|
|
"tps_std": 8.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 254.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 657.18,
|
|
"tps_std": 7.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 336.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 767.82,
|
|
"tps_std": 6.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.71,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 301.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 782.34,
|
|
"tps_std": 9.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 293.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 762.33,
|
|
"tps_std": 0.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 341.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 778.37,
|
|
"tps_std": 3.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.63,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 358.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 755.98,
|
|
"tps_std": 7.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 226.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 766.72,
|
|
"tps_std": 15.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 225.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 742.07,
|
|
"tps_std": 2.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 263.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 763.92,
|
|
"tps_std": 4.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 367.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 753.49,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.76,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 226.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 774.4,
|
|
"tps_std": 6.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 226.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 746.02,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.2,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 274.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 752.08,
|
|
"tps_std": 9.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 38.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 759.84,
|
|
"tps_std": 2.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.66,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 169.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 534.51,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 54.67,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 159.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1430.02,
|
|
"tps_std": 3.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 551.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 24.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1438.05,
|
|
"tps_std": 10.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 555.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 24.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1494.1,
|
|
"tps_std": 6.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 357.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1450.79,
|
|
"tps_std": 15.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 357.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1430.88,
|
|
"tps_std": 12.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 419.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 24.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1399.32,
|
|
"tps_std": 6.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 556.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 24.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1500.8,
|
|
"tps_std": 17.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 479.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1440.0,
|
|
"tps_std": 14.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 478.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1449.04,
|
|
"tps_std": 10.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 619.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1444.02,
|
|
"tps_std": 15.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 612.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1499.09,
|
|
"tps_std": 21.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 350.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1448.72,
|
|
"tps_std": 23.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 352.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1437.87,
|
|
"tps_std": 9.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 443.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1405.44,
|
|
"tps_std": 19.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 454.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1486.29,
|
|
"tps_std": 11.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 352.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1426.84,
|
|
"tps_std": 4.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 351.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1424.62,
|
|
"tps_std": 5.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 446.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1380.59,
|
|
"tps_std": 26.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.29,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 465.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 25.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 574.29,
|
|
"tps_std": 4.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 221.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 448.9,
|
|
"tps_std": 3.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 243.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-F32",
|
|
"model_clean": "gpt-oss-20b-F32",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 38.97,
|
|
"name_params_b": 20.91,
|
|
"quant": "F32",
|
|
"log": "results/gpt-oss-20b-F32__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1333.81,
|
|
"tps_std": 9.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.64,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 537.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1385.54,
|
|
"tps_std": 24.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 544.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1384.08,
|
|
"tps_std": 13.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 349.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1419.39,
|
|
"tps_std": 12.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.24,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 353.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1326.8,
|
|
"tps_std": 18.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.5,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 398.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1365.89,
|
|
"tps_std": 19.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.49,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 456.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1510.54,
|
|
"tps_std": 2.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 474.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1598.15,
|
|
"tps_std": 4.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.02,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 477.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1510.09,
|
|
"tps_std": 10.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 518.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1572.54,
|
|
"tps_std": 11.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.96,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 554.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 56.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1511.0,
|
|
"tps_std": 19.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.04,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 345.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1559.27,
|
|
"tps_std": 17.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.16,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 349.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1476.67,
|
|
"tps_std": 4.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 418.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1526.6,
|
|
"tps_std": 21.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.45,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 431.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1507.89,
|
|
"tps_std": 10.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.07,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 345.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1558.14,
|
|
"tps_std": 14.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.06,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 349.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1463.05,
|
|
"tps_std": 15.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.34,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 422.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1513.62,
|
|
"tps_std": 5.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.47,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 435.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 54.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1681.86,
|
|
"tps_std": 231.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 75.38,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 300.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 46.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1354.58,
|
|
"tps_std": 9.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 77.1,
|
|
"tps_std": 0.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 298.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 52.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-uncensored.Q8_0",
|
|
"model_clean": "gpt-oss-20b-uncensored.Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q8_0",
|
|
"log": "results/gpt-oss-20b-uncensored.Q8_0__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-uncensored.Q8_0",
|
|
"model_clean": "gpt-oss-20b-uncensored.Q8_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q8_0",
|
|
"log": "results/gpt-oss-20b-uncensored.Q8_0__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1091.87,
|
|
"tps_std": 1.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 54.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "31df4608",
|
|
"number": "7038"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1008.52,
|
|
"tps_std": 2.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.29,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 53.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma-improved__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1117.58,
|
|
"tps_std": 1.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.47,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 47.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1012.09,
|
|
"tps_std": 1.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.61,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 46.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1119.14,
|
|
"tps_std": 0.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.51,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 167.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1017.17,
|
|
"tps_std": 2.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.53,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1113.73,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1014.02,
|
|
"tps_std": 2.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.96,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 49.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1116.12,
|
|
"tps_std": 3.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.11,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 186.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1021.92,
|
|
"tps_std": 1.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.07,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 188.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1100.61,
|
|
"tps_std": 4.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 70.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1007.54,
|
|
"tps_std": 4.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 70.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1107.98,
|
|
"tps_std": 1.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.05,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 171.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1015.07,
|
|
"tps_std": 2.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.0,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 174.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ee8dd5c65",
|
|
"number": "7035"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1100.81,
|
|
"tps_std": 1.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 69.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 963.09,
|
|
"tps_std": 2.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 71.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "bca95ca51",
|
|
"number": "7036"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1113.49,
|
|
"tps_std": 3.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 177.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 968.65,
|
|
"tps_std": 2.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.01,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 173.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1378.42,
|
|
"tps_std": 1.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 53.41,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 101.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 9.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1094.33,
|
|
"tps_std": 3.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 53.65,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 174.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "1c398dc9e",
|
|
"number": "7034"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 64.83,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 50.19,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 66.04,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 13.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 50.78,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 62.7,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.71,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 45.01,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.83,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 42.96,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 61.63,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 9.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 36.76,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.93,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 66.33,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 30.17,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 31.42,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 63.23,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 30.12,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 63.17,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 36.22,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.71,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 20.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.03,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 20.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.52,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 56.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.93,
|
|
"tps_std": 1.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.06,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.45,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.02,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 170.89,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.89,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 28.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.53,
|
|
"tps_std": 1.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-rocwmma",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.92,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 61.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.01,
|
|
"tps_std": 0.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1-hblt0",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.95,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 59.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.9,
|
|
"tps_std": 0.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7.1",
|
|
"env_base": "rocm7.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.95,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.82,
|
|
"tps_std": 0.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.85,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.47,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.86,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.05,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.0,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.6,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.59,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.01,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.21,
|
|
"tps_std": 2.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.05,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 170.42,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.88,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.42,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.87,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 57.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.34,
|
|
"tps_std": 0.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.97,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.98,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
}
|
|
]
|
|
} |