gpt-oss : set special tokens back to user defined

aldehir · aldehir · commit 04e162607a17 · 2025-08-11T20:45:45.000-05:00
diff --git a/src/llama-vocab.cpp b/src/llama-vocab.cpp
@@ -2339,6 +2339,13 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {
             }
         }
 
+        // @ngxson : quick hack for gpt-oss, always render these tokens
+        for (const auto & t : token_to_id) {
+            if (t.first == "<|channel|>" || t.first == "<|message|>" || t.first == "<|start|>" || t.first == "<|constrain|>") {
+                id_to_token[t.second].attr = LLAMA_TOKEN_ATTR_USER_DEFINED;
+            }
+        }
+
         // sanity checks
         if (special_eos_id != LLAMA_TOKEN_NULL && special_eog_ids.count(special_eos_id) == 0) {
             special_eog_ids.insert(special_eos_id);
@@ -2381,6 +2388,7 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {
 
             if (has_return && has_call && has_end) {
                 special_eog_ids.erase(end_id);
+                id_to_token[end_id].attr = LLAMA_TOKEN_ATTR_USER_DEFINED;
                 LLAMA_LOG_WARN("%s: special_eog_ids contains both '<|return|>' and '<|call|>' tokens, removing '<|end|>' token from EOG list\n", __func__);
             }
         }

Original file line number	Diff line number	Diff line change
`@@ -2339,6 +2339,13 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {`
`2339`	`2339`	`}`
`2340`	`2340`	`}`
`2341`	`2341`
	`2342`	`+ // @ngxson : quick hack for gpt-oss, always render these tokens`
	`2343`	`+ for (const auto & t : token_to_id) {`
	`2344`	`+ if (t.first == "<\|channel\|>" \|\| t.first == "<\|message\|>" \|\| t.first == "<\|start\|>" \|\| t.first == "<\|constrain\|>") {`
	`2345`	`+ id_to_token[t.second].attr = LLAMA_TOKEN_ATTR_USER_DEFINED;`
	`2346`	`+ }`
	`2347`	`+ }`
	`2348`	`+`
`2342`	`2349`	`// sanity checks`
`2343`	`2350`	`if (special_eos_id != LLAMA_TOKEN_NULL && special_eog_ids.count(special_eos_id) == 0) {`
`2344`	`2351`	`special_eog_ids.insert(special_eos_id);`
`@@ -2381,6 +2388,7 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {`
`2381`	`2388`
`2382`	`2389`	`if (has_return && has_call && has_end) {`
`2383`	`2390`	`special_eog_ids.erase(end_id);`
	`2391`	`+ id_to_token[end_id].attr = LLAMA_TOKEN_ATTR_USER_DEFINED;`
`2384`	`2392`	`LLAMA_LOG_WARN("%s: special_eog_ids contains both '<\|return\|>' and '<\|call\|>' tokens, removing '<\|end\|>' token from EOG list\n", __func__);`
`2385`	`2393`	`}`
`2386`	`2394`	`}`