From 14fae26ad0f790e5fcb3ea1eee71d97d8a7164fa Mon Sep 17 00:00:00 2001 From: Donato Capitella Date: Wed, 15 Apr 2026 08:08:43 +0100 Subject: [PATCH] add minimax m2.7 benchmarks --- ...3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log | 8 + ...f-00004__rocm-7_2_1__fa1__longctx32768.log | 8 + ...Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log | 8 + ...of-00004__rocm6_4_4__fa1__longctx32768.log | 8 + ...L-00001-of-00004__rocm7-nightlies__fa1.log | 8 + ...04__rocm7-nightlies__fa1__longctx32768.log | 8 + ..._XL-00001-of-00004__vulkan_amdvlk__fa1.log | 8 + ...0004__vulkan_amdvlk__fa1__longctx32768.log | 8 + ..._K_XL-00001-of-00004__vulkan_radv__fa1.log | 8 + ...-00004__vulkan_radv__fa1__longctx32768.log | 8 + docs/results.json | 566 +++++++++++++++++- 11 files changed, 645 insertions(+), 1 deletion(-) create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log create mode 100644 benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log new file mode 100644 index 0000000..4cd2596 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | pp512 | 245.94 ± 1.48 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | tg128 | 24.11 ± 0.05 | + +build: ff5ef8278 (8763) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log new file mode 100644 index 0000000..243dd87 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | n_ubatch | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -------: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | pp2048 @ d32768 | 66.09 ± 0.53 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | tg32 @ d32768 | 6.32 ± 0.05 | + +build: ff5ef8278 (8763) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log new file mode 100644 index 0000000..3f5143a --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | pp512 | 245.63 ± 1.62 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | tg128 | 22.63 ± 0.07 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log new file mode 100644 index 0000000..2282246 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | n_ubatch | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -------: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | pp2048 @ d32768 | 79.52 ± 0.47 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | tg32 @ d32768 | 6.69 ± 0.15 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log new file mode 100644 index 0000000..41d8882 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | pp512 | 237.43 ± 0.96 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 1 | 0 | tg128 | 22.63 ± 0.05 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log new file mode 100644 index 0000000..2090c73 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log @@ -0,0 +1,8 @@ +ggml_cuda_init: found 1 ROCm devices (Total VRAM: 126976 MiB): + Device 0: Radeon 8060S Graphics, gfx1151 (0x1151), VMM: no, Wave Size: 32, VRAM: 126976 MiB +| model | size | params | backend | ngl | n_ubatch | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -------: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | pp2048 @ d32768 | 61.53 ± 0.27 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | ROCm | 99 | 2048 | 1 | 0 | tg32 @ d32768 | 6.52 ± 0.17 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log new file mode 100644 index 0000000..a893a6a --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log @@ -0,0 +1,8 @@ +ggml_vulkan: Found 1 Vulkan devices: +ggml_vulkan: 0 = Radeon 8060S Graphics (AMD open-source driver) | uma: 1 | fp16: 1 | bf16: 0 | warp size: 64 | shared memory: 32768 | int dot: 1 | matrix cores: KHR_coopmat +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | pp512 | 203.53 ± 0.70 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | tg128 | 24.06 ± 0.03 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log new file mode 100644 index 0000000..3cd97d8 --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log @@ -0,0 +1,8 @@ +ggml_vulkan: Found 1 Vulkan devices: +ggml_vulkan: 0 = Radeon 8060S Graphics (AMD open-source driver) | uma: 1 | fp16: 1 | bf16: 0 | warp size: 64 | shared memory: 32768 | int dot: 1 | matrix cores: KHR_coopmat +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | pp2048 @ d32768 | 31.94 ± 0.07 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | tg32 @ d32768 | 10.05 ± 0.01 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log new file mode 100644 index 0000000..0f184ff --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log @@ -0,0 +1,8 @@ +ggml_vulkan: Found 1 Vulkan devices: +ggml_vulkan: 0 = Radeon 8060S Graphics (RADV GFX1151) (radv) | uma: 1 | fp16: 1 | bf16: 0 | warp size: 64 | shared memory: 65536 | int dot: 1 | matrix cores: KHR_coopmat +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | pp512 | 234.24 ± 1.27 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | tg128 | 29.48 ± 0.01 | + +build: 3f8752b55 (8743) diff --git a/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log new file mode 100644 index 0000000..8cb49dc --- /dev/null +++ b/benchmark/results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log @@ -0,0 +1,8 @@ +ggml_vulkan: Found 1 Vulkan devices: +ggml_vulkan: 0 = Radeon 8060S Graphics (RADV GFX1151) (radv) | uma: 1 | fp16: 1 | bf16: 0 | warp size: 64 | shared memory: 65536 | int dot: 1 | matrix cores: KHR_coopmat +| model | size | params | backend | ngl | fa | mmap | test | t/s | +| ------------------------------ | ---------: | ---------: | ---------- | --: | -: | ---: | --------------: | -------------------: | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | pp2048 @ d32768 | 32.31 ± 0.16 | +| minimax-m2 230B.A10B Q3_K - Medium | 94.93 GiB | 228.69 B | Vulkan | 99 | 1 | 0 | tg32 @ d32768 | 14.20 ± 0.01 | + +build: 3f8752b55 (8743) diff --git a/docs/results.json b/docs/results.json index f9933b5..2facb03 100644 --- a/docs/results.json +++ b/docs/results.json @@ -1,6 +1,6 @@ { "meta": { - "generated_at": "2026-04-11T10:20:08Z", + "generated_at": "2026-04-15T07:08:17Z", "system_info": { "distro": "Fedora Linux 43 (Workstation Edition)", "kernel": "6.19.9-200.fc43.x86_64", @@ -11,6 +11,10 @@ { "hash": "3f8752b55", "number": "8743" + }, + { + "hash": "ff5ef8278", + "number": "8763" } ], "environments": [ @@ -1636,6 +1640,566 @@ "number": "8743" } }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm-7_2_1", + "env_base": "rocm", + "env_variant": "7_2_1", + "fa": true, + "context": "default", + "context_tokens": null, + "test": "pp512", + "tps_mean": 245.94, + "tps_std": 1.48, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log", + "rpc": false, + "build": { + "hash": "ff5ef8278", + "number": "8763" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm-7_2_1", + "env_base": "rocm", + "env_variant": "7_2_1", + "fa": true, + "context": "default", + "context_tokens": null, + "test": "tg128", + "tps_mean": 24.11, + "tps_std": 0.05, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log", + "rpc": false, + "build": { + "hash": "ff5ef8278", + "number": "8763" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm-7_2_1", + "env_base": "rocm", + "env_variant": "7_2_1", + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "pp2048 @ d32768", + "tps_mean": 66.09, + "tps_std": 0.53, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "ff5ef8278", + "number": "8763" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm-7_2_1", + "env_base": "rocm", + "env_variant": "7_2_1", + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "tg32 @ d32768", + "tps_mean": 6.32, + "tps_std": 0.05, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "ff5ef8278", + "number": "8763" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm6_4_4", + "env_base": "rocm6_4_4", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "pp512", + "tps_mean": 245.63, + "tps_std": 1.62, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm6_4_4", + "env_base": "rocm6_4_4", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "tg128", + "tps_mean": 22.63, + "tps_std": 0.07, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm6_4_4", + "env_base": "rocm6_4_4", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "pp2048 @ d32768", + "tps_mean": 79.52, + "tps_std": 0.47, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm6_4_4", + "env_base": "rocm6_4_4", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "tg32 @ d32768", + "tps_mean": 6.69, + "tps_std": 0.15, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm7-nightlies", + "env_base": "rocm7", + "env_variant": "nightlies", + "fa": true, + "context": "default", + "context_tokens": null, + "test": "pp512", + "tps_mean": 237.43, + "tps_std": 0.96, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm7-nightlies", + "env_base": "rocm7", + "env_variant": "nightlies", + "fa": true, + "context": "default", + "context_tokens": null, + "test": "tg128", + "tps_mean": 22.63, + "tps_std": 0.05, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm7-nightlies", + "env_base": "rocm7", + "env_variant": "nightlies", + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "pp2048 @ d32768", + "tps_mean": 61.53, + "tps_std": 0.27, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "rocm7-nightlies", + "env_base": "rocm7", + "env_variant": "nightlies", + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "tg32 @ d32768", + "tps_mean": 6.52, + "tps_std": 0.17, + "error": false, + "error_type": null, + "backend": "ROCm", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_amdvlk", + "env_base": "vulkan_amdvlk", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "pp512", + "tps_mean": 203.53, + "tps_std": 0.7, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_amdvlk", + "env_base": "vulkan_amdvlk", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "tg128", + "tps_mean": 24.06, + "tps_std": 0.03, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_amdvlk", + "env_base": "vulkan_amdvlk", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "pp2048 @ d32768", + "tps_mean": 31.94, + "tps_std": 0.07, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_amdvlk", + "env_base": "vulkan_amdvlk", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "tg32 @ d32768", + "tps_mean": 10.05, + "tps_std": 0.01, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_radv", + "env_base": "vulkan_radv", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "pp512", + "tps_mean": 234.24, + "tps_std": 1.27, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_radv", + "env_base": "vulkan_radv", + "env_variant": null, + "fa": true, + "context": "default", + "context_tokens": null, + "test": "tg128", + "tps_mean": 29.48, + "tps_std": 0.01, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_radv", + "env_base": "vulkan_radv", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "pp2048 @ d32768", + "tps_mean": 32.31, + "tps_std": 0.16, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, + { + "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", + "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", + "env": "vulkan_radv", + "env_base": "vulkan_radv", + "env_variant": null, + "fa": true, + "context": "longctx32768", + "context_tokens": 32768, + "test": "tg32 @ d32768", + "tps_mean": 14.2, + "tps_std": 0.01, + "error": false, + "error_type": null, + "backend": "Vulkan", + "ngl": 99, + "mmap": 0, + "params_b": 228.69, + "file_size_gib": 94.93, + "name_params_b": 228.69, + "quant": "Q3_K_XL", + "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", + "rpc": false, + "build": { + "hash": "3f8752b55", + "number": "8743" + } + }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16",