Skip to content

Commit 35ae992

Browse files
authored
llama-bench: print -n-cpu-moe when offloaded layers > 1 (ggml-org#20984)
1 parent a1d4c18 commit 35ae992

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

tools/llama-bench/llama-bench.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1807,7 +1807,7 @@ struct markdown_printer : public printer {
18071807
if (!is_cpu_backend) {
18081808
fields.emplace_back("n_gpu_layers");
18091809
}
1810-
if (params.n_cpu_moe.size() > 1) {
1810+
if (params.n_cpu_moe.size() > 1 || params.n_cpu_moe != cmd_params_defaults.n_cpu_moe) {
18111811
fields.emplace_back("n_cpu_moe");
18121812
}
18131813
if (params.n_threads.size() > 1 || params.n_threads != cmd_params_defaults.n_threads || is_cpu_backend) {

0 commit comments

Comments
 (0)