convert : set "add bos" to True for Gemma 4 (ggml-org#21500)

ggerganov · icex · commit 7a22c32e4e2f · 2026-04-12T23:38:02.000+03:00
* convert : set "add bos" to True for Gemma 4

* cont : handle old GGUFs (force "add bos" to true at load time when the vocab pre-type is Gemma 4)
diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
@@ -7472,7 +7472,7 @@ def set_vocab(self):
         special_vocab = gguf.SpecialVocab(self.dir_model, load_merges=True)
         special_vocab.add_to_gguf(self.gguf_writer)
         self.gguf_writer.add_add_space_prefix(False)
-        self.gguf_writer.add_add_bos_token(False) # already added via the chat template
+        self.gguf_writer.add_add_bos_token(True)
 
     def set_gguf_parameters(self):
         super().set_gguf_parameters()
diff --git a/src/llama-vocab.cpp b/src/llama-vocab.cpp
@@ -2325,6 +2325,14 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {
             if (ml.get_key(LLM_KV_TOKENIZER_ADD_SEP, temp, false)) {
                 add_sep = temp;
             }
+
+            // workaround for Gemma 4
+            // ref: https://github.com/ggml-org/llama.cpp/pull/21500
+            if (pre_type == LLAMA_VOCAB_PRE_TYPE_GEMMA4 && !add_bos) {
+                add_bos = true;
+
+                LLAMA_LOG_WARN("%s: override '%s' to 'true' for Gemma4\n", __func__, kv(LLM_KV_TOKENIZER_ADD_BOS).c_str());
+            }
         }
 
         // auto-detect special tokens by text

Original file line number	Diff line number	Diff line change
`@@ -2325,6 +2325,14 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {`
`2325`	`2325`	`if (ml.get_key(LLM_KV_TOKENIZER_ADD_SEP, temp, false)) {`
`2326`	`2326`	`add_sep = temp;`
`2327`	`2327`	`}`
	`2328`	`+`
	`2329`	`+ // workaround for Gemma 4`
	`2330`	`+ // ref: https://github.com/ggml-org/llama.cpp/pull/21500`
	`2331`	`+ if (pre_type == LLAMA_VOCAB_PRE_TYPE_GEMMA4 && !add_bos) {`
	`2332`	`+ add_bos = true;`
	`2333`	`+`
	`2334`	`+ LLAMA_LOG_WARN("%s: override '%s' to 'true' for Gemma4\n", __func__, kv(LLM_KV_TOKENIZER_ADD_BOS).c_str());`
	`2335`	`+ }`
`2328`	`2336`	`}`
`2329`	`2337`
`2330`	`2338`	`// auto-detect special tokens by text`