34623 lines
939 KiB
JSON
34623 lines
939 KiB
JSON
{
|
|
"meta": {
|
|
"generated_at": "2025-12-21T18:48:48Z",
|
|
"os_kernel": "Fedora 42 \u2014 Linux 6.15.9-201.fc42.x86_64 (Sat Aug 2 11:37:34 UTC 2025)",
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
},
|
|
{
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
},
|
|
{
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
},
|
|
{
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm-7alpha",
|
|
"rocm-7alpha-hblt0",
|
|
"rocm-7alpha-rocwmma",
|
|
"rocm-7alpha-rocwmma-hblt0",
|
|
"rocm-7alpha-rocwmma-improved",
|
|
"rocm-7alpha-rocwmma-improved-hblt0",
|
|
"rocm6_4_4",
|
|
"rocm6_4_4-hblt0",
|
|
"rocm6_4_4-rocwmma",
|
|
"rocm6_4_4-rocwmma-hblt0",
|
|
"rocm7.1.1",
|
|
"rocm7.1.1-hblt0",
|
|
"rocm7.1.1-rocwmma",
|
|
"rocm7.1.1-rocwmma-hblt0",
|
|
"rocm7_1",
|
|
"rocm7_1-hblt0",
|
|
"rocm7_1-rocwmma",
|
|
"rocm7_1-rocwmma-hblt0",
|
|
"rocm7_rc",
|
|
"rocm7_rc-hblt0",
|
|
"rocm7_rc-rocwmma",
|
|
"rocm7_rc-rocwmma-hblt0",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 247.81,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.45,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 37.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 246.64,
|
|
"tps_std": 0.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 37.54,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 250.33,
|
|
"tps_std": 0.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 84.5,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 250.13,
|
|
"tps_std": 0.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 330.74,
|
|
"tps_std": 2.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 33.8,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 330.13,
|
|
"tps_std": 0.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 33.91,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 333.45,
|
|
"tps_std": 1.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 98.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 336.2,
|
|
"tps_std": 2.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 98.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 323.36,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 47.07,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 323.91,
|
|
"tps_std": 1.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 46.62,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 330.9,
|
|
"tps_std": 1.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 329.23,
|
|
"tps_std": 1.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 323.77,
|
|
"tps_std": 1.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 46.38,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 323.19,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 46.51,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 330.87,
|
|
"tps_std": 0.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 330.19,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 228.89,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 40.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 9.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 243.57,
|
|
"tps_std": 0.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 52.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "GLM-4.5-Air-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 14.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 68.01,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.43,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 36.61,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.23,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 36.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.45,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.5,
|
|
"tps_std": 0.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.71,
|
|
"tps_std": 0.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 275.04,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 33.7,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 272.75,
|
|
"tps_std": 1.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 33.85,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 277.38,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 92.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 277.33,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 92.73,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 254.32,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 46.17,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 253.04,
|
|
"tps_std": 1.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 46.53,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 257.7,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 259.4,
|
|
"tps_std": 0.46,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 254.22,
|
|
"tps_std": 1.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 45.9,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 253.25,
|
|
"tps_std": 1.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 45.93,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 258.89,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 79.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 279.25,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.61,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 42.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 244.36,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 54.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003",
|
|
"model_clean": "GLM-4.5-Air-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 110.47,
|
|
"file_size_gib": 94.57,
|
|
"name_params_b": 110.47,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/GLM-4.5-Air-UD-Q6_K_XL-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 23.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.41,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 24.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.85,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 37.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.38,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 37.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.84,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 26.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.36,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 26.46,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.01,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 56.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.28,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 56.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.01,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 35.23,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.94,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 34.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 147.07,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 70.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.12,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 52.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.84,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 35.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.47,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 35.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 1.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.96,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 70.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.24,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 52.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 100.73,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 30.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 88.29,
|
|
"tps_std": 0.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 31.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 2.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 70.55,
|
|
"file_size_gib": 75.65,
|
|
"name_params_b": 70.55,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 788.05,
|
|
"tps_std": 2.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 139.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 5.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 787.49,
|
|
"tps_std": 3.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 136.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 5.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 799.32,
|
|
"tps_std": 2.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 273.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 804.49,
|
|
"tps_std": 4.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 282.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 792.57,
|
|
"tps_std": 2.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 121.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 794.96,
|
|
"tps_std": 3.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 118.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 802.78,
|
|
"tps_std": 0.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 289.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 810.15,
|
|
"tps_std": 2.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 316.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 781.49,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 176.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 795.45,
|
|
"tps_std": 1.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 179.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 797.09,
|
|
"tps_std": 3.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 261.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 800.44,
|
|
"tps_std": 2.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 282.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 794.13,
|
|
"tps_std": 2.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 177.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 757.71,
|
|
"tps_std": 0.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 175.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 803.93,
|
|
"tps_std": 1.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 266.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 767.62,
|
|
"tps_std": 3.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 280.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 7.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 228.96,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 101.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 198.3,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 98.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 6.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 575.9,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 815.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 37.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 566.25,
|
|
"tps_std": 5.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.75,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 818.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 37.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 573.96,
|
|
"tps_std": 1.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 840.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 568.52,
|
|
"tps_std": 6.46,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 842.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1111.52,
|
|
"tps_std": 3.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1161.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1075.82,
|
|
"tps_std": 2.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.19,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1159.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1111.9,
|
|
"tps_std": 4.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.13,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1083.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1074.4,
|
|
"tps_std": 7.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.17,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1126.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1110.04,
|
|
"tps_std": 2.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.43,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1034.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1073.92,
|
|
"tps_std": 6.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1041.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1119.24,
|
|
"tps_std": 8.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 964.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1086.57,
|
|
"tps_std": 5.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.44,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 972.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1100.11,
|
|
"tps_std": 6.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.51,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1036.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1066.41,
|
|
"tps_std": 6.56,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1030.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 38.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1110.36,
|
|
"tps_std": 6.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.23,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1042.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1074.73,
|
|
"tps_std": 4.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1001.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1224.54,
|
|
"tps_std": 7.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.56,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 569.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 940.69,
|
|
"tps_std": 5.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.38,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 489.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 31.58,
|
|
"file_size_gib": 37.66,
|
|
"name_params_b": 31.58,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.33,
|
|
"tps_std": 3.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 73.22,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.28,
|
|
"tps_std": 1.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 72.86,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.82,
|
|
"tps_std": 1.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 63.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 196.8,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.01,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 65.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 198.21,
|
|
"tps_std": 1.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.09,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 66.78,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 202.49,
|
|
"tps_std": 1.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 69.68,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 205.39,
|
|
"tps_std": 1.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 201.21,
|
|
"tps_std": 1.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 197.07,
|
|
"tps_std": 0.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 65.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 5.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 195.14,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.08,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 64.99,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 199.48,
|
|
"tps_std": 2.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.91,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 197.33,
|
|
"tps_std": 0.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 62.78,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 199.34,
|
|
"tps_std": 1.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.09,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 62.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 5.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 201.37,
|
|
"tps_std": 1.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.91,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 199.51,
|
|
"tps_std": 1.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.98,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 235.0,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.16,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.77,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 31.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 5.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 131.53,
|
|
"tps_std": 1.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.08,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 34.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 9.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 235.09,
|
|
"file_size_gib": 96.99,
|
|
"name_params_b": 235.09,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 489.1,
|
|
"tps_std": 3.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 282.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 491.47,
|
|
"tps_std": 1.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 271.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 14.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 491.95,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 336.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 492.47,
|
|
"tps_std": 3.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 318.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 567.78,
|
|
"tps_std": 2.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 268.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 18.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 575.99,
|
|
"tps_std": 6.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 255.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 18.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.13,
|
|
"tps_std": 3.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.13,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 30.0,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "hang",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 30.0,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 377.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 460.49,
|
|
"tps_std": 1.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.12,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 234.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 17.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 467.86,
|
|
"tps_std": 1.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 224.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 18.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 468.47,
|
|
"tps_std": 2.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 360.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 470.04,
|
|
"tps_std": 3.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 337.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 461.77,
|
|
"tps_std": 2.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 234.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 18.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 463.39,
|
|
"tps_std": 4.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 223.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 18.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 466.61,
|
|
"tps_std": 1.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 319.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 473.68,
|
|
"tps_std": 1.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 337.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 194.36,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.96,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 86.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 8.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 167.29,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.36,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 102.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3-30B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 8.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 56.89,
|
|
"name_params_b": 30.53,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 883.95,
|
|
"tps_std": 6.89,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 323.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 20.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 888.32,
|
|
"tps_std": 6.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 323.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 20.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 887.98,
|
|
"tps_std": 2.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 273.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 897.81,
|
|
"tps_std": 13.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.56,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 273.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 40.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1045.84,
|
|
"tps_std": 8.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 310.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1046.62,
|
|
"tps_std": 8.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 313.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1065.87,
|
|
"tps_std": 15.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.71,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 353.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1056.16,
|
|
"tps_std": 8.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.68,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 341.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 961.79,
|
|
"tps_std": 10.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.69,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 263.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 964.88,
|
|
"tps_std": 9.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 263.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 992.39,
|
|
"tps_std": 4.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 286.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 984.99,
|
|
"tps_std": 7.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.39,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 284.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 966.17,
|
|
"tps_std": 7.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.85,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 263.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 960.5,
|
|
"tps_std": 8.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.91,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 263.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 986.79,
|
|
"tps_std": 6.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.42,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 410.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 984.07,
|
|
"tps_std": 5.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 57.52,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 282.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1129.76,
|
|
"tps_std": 4.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 62.27,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 135.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 33.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 905.18,
|
|
"tps_std": 4.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 66.46,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 172.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 24.53,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1189.07,
|
|
"tps_std": 7.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 332.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 21.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1185.59,
|
|
"tps_std": 10.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.65,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 338.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 21.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1185.88,
|
|
"tps_std": 9.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.64,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 295.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 45.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1189.9,
|
|
"tps_std": 9.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 71.61,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 291.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 45.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1201.14,
|
|
"tps_std": 12.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.92,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 319.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 30.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1208.02,
|
|
"tps_std": 13.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.87,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 321.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 30.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1225.68,
|
|
"tps_std": 19.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.13,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 387.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.53,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1231.06,
|
|
"tps_std": 2.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 361.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 44.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1172.29,
|
|
"tps_std": 9.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.19,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 29.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1169.43,
|
|
"tps_std": 4.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.31,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.83,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 30.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1183.05,
|
|
"tps_std": 9.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.17,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 292.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1195.38,
|
|
"tps_std": 5.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 287.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1166.57,
|
|
"tps_std": 8.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.37,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.55,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 30.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1167.1,
|
|
"tps_std": 5.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 69.33,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 30.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1194.63,
|
|
"tps_std": 7.87,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.98,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 292.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1202.35,
|
|
"tps_std": 10.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.96,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 292.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 44.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 825.86,
|
|
"tps_std": 2.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.94,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 130.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 37.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 864.66,
|
|
"tps_std": 2.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 83.07,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 168.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 47.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 345.64,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 344.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 20.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 356.53,
|
|
"tps_std": 3.9,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.26,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 352.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 24.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 346.29,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 379.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.22,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 27.35,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 386.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 25.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 573.57,
|
|
"tps_std": 2.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 464.91,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 595.88,
|
|
"tps_std": 2.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 480.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 23.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 576.31,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 489.52,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 24.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 590.68,
|
|
"tps_std": 0.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.38,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 503.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 25.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 571.05,
|
|
"tps_std": 4.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.45,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 444.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 21.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 594.4,
|
|
"tps_std": 3.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 451.46,
|
|
"tps_std": 0.0,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 568.38,
|
|
"tps_std": 2.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.5,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 462.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 22.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 587.5,
|
|
"tps_std": 6.59,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 479.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 21.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 567.13,
|
|
"tps_std": 2.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.44,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 438.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 23.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 594.63,
|
|
"tps_std": 11.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.76,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 442.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 23.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 570.28,
|
|
"tps_std": 3.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 473.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 24.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 588.8,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 26.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 488.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 21.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 406.08,
|
|
"tps_std": 1.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 33.67,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 194.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 326.83,
|
|
"tps_std": 0.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.18,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 220.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002",
|
|
"model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 27.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 79.67,
|
|
"file_size_gib": 79.57,
|
|
"name_params_b": 79.67,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 421.94,
|
|
"tps_std": 0.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 332.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 424.57,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 325.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 429.89,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 309.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 430.69,
|
|
"tps_std": 0.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.25,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 338.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 897.73,
|
|
"tps_std": 0.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 288.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 904.28,
|
|
"tps_std": 1.51,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 290.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 913.75,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 425.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 919.42,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.19,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 430.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 886.59,
|
|
"tps_std": 0.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 303.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 890.97,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 304.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 910.34,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 391.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.8,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 917.22,
|
|
"tps_std": 0.99,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 394.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 882.81,
|
|
"tps_std": 0.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 302.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 891.69,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 306.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 913.03,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 399.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 917.06,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.27,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 391.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 690.02,
|
|
"tps_std": 1.72,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 54.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 549.78,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 13.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-3-12b-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 11.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 11.77,
|
|
"file_size_gib": 13.4,
|
|
"name_params_b": 11.77,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 468.46,
|
|
"tps_std": 1.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 167.6,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 522.97,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 170.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 477.16,
|
|
"tps_std": 1.86,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 237.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 527.33,
|
|
"tps_std": 1.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 270.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 468.3,
|
|
"tps_std": 0.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 167.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 525.67,
|
|
"tps_std": 0.68,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 169.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 472.62,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 246.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 530.96,
|
|
"tps_std": 0.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 285.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.86,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 463.74,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 193.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 522.71,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 205.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 466.55,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 234.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 526.17,
|
|
"tps_std": 0.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 269.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 462.78,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 194.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 499.88,
|
|
"tps_std": 0.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 195.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 474.02,
|
|
"tps_std": 0.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 308.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 506.0,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 4.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 320.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "load",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 107.99,
|
|
"tps_std": 1.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 67.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-27b-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-3-27b-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 3.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 27.01,
|
|
"file_size_gib": 50.31,
|
|
"name_params_b": 27.01,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2767.54,
|
|
"tps_std": 1.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.17,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1439.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 68.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2762.69,
|
|
"tps_std": 4.25,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.08,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1442.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 68.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2759.74,
|
|
"tps_std": 13.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.86,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1331.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 71.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2748.02,
|
|
"tps_std": 15.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 84.54,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1341.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 71.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2907.52,
|
|
"tps_std": 4.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.61,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1365.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 66.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2902.86,
|
|
"tps_std": 2.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.68,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1384.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 66.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2868.25,
|
|
"tps_std": 16.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.93,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1413.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 67.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2874.9,
|
|
"tps_std": 17.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.07,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1414.92,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 68.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2812.03,
|
|
"tps_std": 15.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.66,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1347.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 66.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2820.5,
|
|
"tps_std": 10.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.66,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1390.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 67.23,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2853.13,
|
|
"tps_std": 21.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.93,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1368.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 68.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2846.23,
|
|
"tps_std": 16.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.96,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1361.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 67.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2843.92,
|
|
"tps_std": 0.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.68,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1377.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 66.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2841.34,
|
|
"tps_std": 6.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 78.55,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1340.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 67.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2888.98,
|
|
"tps_std": 3.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.99,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1300.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 65.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 2874.43,
|
|
"tps_std": 2.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 81.99,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 1332.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 67.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1798.72,
|
|
"tps_std": 4.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 90.73,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 466.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 74.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1633.15,
|
|
"tps_std": 4.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 85.91,
|
|
"tps_std": 0.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 776.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-3-4b-it-Q3_K_S",
|
|
"model_clean": "gemma-3-4b-it-Q3_K_S",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 58.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 3.88,
|
|
"file_size_gib": 1.8,
|
|
"name_params_b": 3.88,
|
|
"quant": "Q3_K_S",
|
|
"log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 274.17,
|
|
"tps_std": 2.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 303.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 29.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 276.82,
|
|
"tps_std": 4.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.95,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 303.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 29.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 274.29,
|
|
"tps_std": 0.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.18,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 301.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 274.47,
|
|
"tps_std": 1.46,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.23,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 289.74,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 657.63,
|
|
"tps_std": 7.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 479.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 649.55,
|
|
"tps_std": 10.69,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 480.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 654.41,
|
|
"tps_std": 2.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 470.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 45.0,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 658.64,
|
|
"tps_std": 9.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 472.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 45.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 637.48,
|
|
"tps_std": 24.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.66,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 412.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 653.6,
|
|
"tps_std": 10.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 409.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 639.37,
|
|
"tps_std": 5.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 496.89,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 646.49,
|
|
"tps_std": 8.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.16,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 501.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 44.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 645.91,
|
|
"tps_std": 13.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.67,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 410.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 653.08,
|
|
"tps_std": 2.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.78,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 413.56,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 28.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 637.84,
|
|
"tps_std": 10.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.22,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 522.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 43.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 642.63,
|
|
"tps_std": 7.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.17,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 532.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 44.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 792.77,
|
|
"tps_std": 0.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 52.34,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 266.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 39.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 543.66,
|
|
"tps_std": 0.88,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.37,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 299.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 45.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 791.2,
|
|
"tps_std": 5.92,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.24,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 539.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 795.34,
|
|
"tps_std": 8.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.28,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 538.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 788.07,
|
|
"tps_std": 19.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.65,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 585.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 61.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 777.22,
|
|
"tps_std": 12.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 533.9,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 61.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1752.24,
|
|
"tps_std": 12.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.82,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 796.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.1,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1717.36,
|
|
"tps_std": 12.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 796.57,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1710.01,
|
|
"tps_std": 23.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 808.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 64.31,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1726.91,
|
|
"tps_std": 4.81,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 817.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 64.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1710.28,
|
|
"tps_std": 7.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.12,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 670.09,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.17,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1695.75,
|
|
"tps_std": 25.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.15,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 668.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1670.49,
|
|
"tps_std": 30.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.45,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 658.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 62.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1661.92,
|
|
"tps_std": 6.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.41,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 654.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 62.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1692.63,
|
|
"tps_std": 8.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 668.58,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1721.79,
|
|
"tps_std": 15.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 665.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 42.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1668.78,
|
|
"tps_std": 30.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 633.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 62.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1674.84,
|
|
"tps_std": 21.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.29,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 644.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 62.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1965.23,
|
|
"tps_std": 21.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 75.24,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 512.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 56.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1395.08,
|
|
"tps_std": 16.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 79.6,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 467.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 65.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1556.97,
|
|
"tps_std": 0.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.65,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 94.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1561.25,
|
|
"tps_std": 2.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.59,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 94.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1572.74,
|
|
"tps_std": 2.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.65,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 351.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1572.88,
|
|
"tps_std": 2.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.64,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 346.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 10.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7alpha__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1525.39,
|
|
"tps_std": 0.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.05,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 104.91,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1524.22,
|
|
"tps_std": 2.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 106.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1539.28,
|
|
"tps_std": 0.84,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 384.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1538.89,
|
|
"tps_std": 3.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.07,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 382.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 12.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1492.67,
|
|
"tps_std": 1.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.89,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 141.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.37,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1495.58,
|
|
"tps_std": 2.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.97,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 141.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-rocwmma-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1526.32,
|
|
"tps_std": 2.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.96,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 348.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.34,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1530.07,
|
|
"tps_std": 0.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.01,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 348.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7.1.1-hblt0",
|
|
"env_base": "rocm7.1.1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7.1.1__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1493.41,
|
|
"tps_std": 1.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.9,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 139.87,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1494.79,
|
|
"tps_std": 2.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.91,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 139.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.36,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc-rocwmma__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1529.76,
|
|
"tps_std": 1.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 350.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1530.14,
|
|
"tps_std": 1.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 347.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 13.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7_rc__hblt0__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1494.56,
|
|
"tps_std": 4.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.03,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 196.22,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 15.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1135.49,
|
|
"tps_std": 4.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.73,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "pp2048 @ d16384",
|
|
"tps_mean": 294.01,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx16384",
|
|
"context_tokens": 16384,
|
|
"test": "tg32 @ d16384",
|
|
"tps_mean": 15.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx16384.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "2aa45ef9e",
|
|
"number": "7423"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.54,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 64.83,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.69,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.03,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 50.19,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 16.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 66.04,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 13.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.82,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 50.78,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 62.7,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.71,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 45.01,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 65.83,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 42.96,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 61.63,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 9.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 36.76,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.93,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.98,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 66.33,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.04,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 6.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 30.17,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 12.79,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 31.42,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 63.23,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.7,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 8.13,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 0.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 30.12,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 63.17,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.72,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 36.22,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005",
|
|
"model_clean": "GLM-4.6-UD-Q4_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.71,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 356.79,
|
|
"file_size_gib": 189.69,
|
|
"name_params_b": 356.79,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 20.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.03,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 20.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.52,
|
|
"tps_std": 1.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-rocwmma",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "caca0d55c",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 56.85,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.93,
|
|
"tps_std": 1.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4-hblt0",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.06,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.45,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.02,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "86f1f4411",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 170.89,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.89,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 28.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.53,
|
|
"tps_std": 1.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-rocwmma",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.92,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "f1840a25d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 61.44,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.68,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 172.01,
|
|
"tps_std": 0.91,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1-hblt0",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.95,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 59.64,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.9,
|
|
"tps_std": 0.67,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_1",
|
|
"env_base": "rocm7_1",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.95,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_1__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "677be4d78",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.46,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 142.82,
|
|
"tps_std": 0.78,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.85,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 34.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.47,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-improved",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-improved",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.86,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma-improved__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "12bb5c37",
|
|
"number": "7074"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.4,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 143.05,
|
|
"tps_std": 1.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.0,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 22.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 1.84,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 145.6,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-rocwmma",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4db63cdde",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 144.59,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha-hblt0",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.01,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 55.38,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.7,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 146.21,
|
|
"tps_std": 2.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm-7alpha",
|
|
"env_base": "rocm",
|
|
"env_variant": "7alpha",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.05,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_alpha__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "4fc43d43d",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.15,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 170.42,
|
|
"tps_std": 0.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma-hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.88,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 29.32,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 174.42,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-rocwmma",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "rocwmma",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.87,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc-rocwmma__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "b447a9a4b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 57.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.67,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 171.34,
|
|
"tps_std": 0.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc-hblt0",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": "hblt0",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.97,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__hblt0__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__longctx32768__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 173.98,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "rocm7_rc",
|
|
"env_base": "rocm7_rc",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 17.94,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm,RPC",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 180.94,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7_rc__rpc.log",
|
|
"rpc": true,
|
|
"build": {
|
|
"hash": "fa5c85a8b",
|
|
"number": "7085"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2-UD-Q6_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": false,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q6_K_XL",
|
|
"log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__rpc.log",
|
|
"rpc": true,
|
|
"build": null
|
|
}
|
|
]
|
|
} |