chat: Allow reasoning_content to be passed back

tarruda · tarruda · commit de4343aab626 · 2025-11-02T07:12:15.000-03:00
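This makes it possible for an assistant message to pass `reasoning_content` back to llama-server, even when the message has no `content` or `tool_calls`.
This is useful for LLMs such as GPT-OSS or MiniMax-M2, which were trained to receive their earlier reasoning as part of the conversation.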
diff --git a/common/chat.cpp b/common/chat.cpp
@@ -201,6 +201,7 @@ std::vector<common_chat_msg> common_chat_msgs_parse_oaicompat(const json & messa
             msg.role = message.at("role");
 
             auto has_content = message.contains("content");
+            auto has_reasoning_content = message.contains("reasoning_content");
             auto has_tool_calls = message.contains("tool_calls");
             if (has_content) {
                 const auto & content = message.at("content");
@@ -249,8 +250,8 @@ std::vector<common_chat_msg> common_chat_msgs_parse_oaicompat(const json & messa
                     msg.tool_calls.push_back(tc);
                 }
             }
-            if (!has_content && !has_tool_calls) {
-                throw std::runtime_error("Expected 'content' or 'tool_calls' (ref: https://github.com/ggml-org/llama.cpp/issues/8367 & https://github.com/ggml-org/llama.cpp/issues/12279)");
+            if (!has_content && !has_tool_calls && !has_reasoning_content) {
+                throw std::runtime_error("Expected 'content', 'reasoning_content' or 'tool_calls' (ref: https://github.com/ggml-org/llama.cpp/issues/8367 & https://github.com/ggml-org/llama.cpp/issues/12279)");
             }
             if (message.contains("reasoning_content")) {
                 msg.reasoning_content = message.at("reasoning_content");
diff --git a/tools/server/utils.hpp b/tools/server/utils.hpp
@@ -595,8 +595,8 @@ static json oaicompat_chat_params_parse(
             throw std::runtime_error("All non-assistant messages must contain 'content'");
         }
         if (role == "assistant") {
-            if (!msg.contains("content") && !msg.contains("tool_calls")) {
-                throw std::runtime_error("Assistant message must contain either 'content' or 'tool_calls'!");
+            if (!msg.contains("content") && !msg.contains("tool_calls") && !msg.contains("reasoning_content")) {
+                throw std::runtime_error("Assistant message must contain either 'content' or 'tool_calls' or 'reasoning_content'!");
             }
             if (!msg.contains("content")) {
                 continue; // avoid errors with no content

Original file line number	Diff line number	Diff line change
`@@ -201,6 +201,7 @@ std::vector<common_chat_msg> common_chat_msgs_parse_oaicompat(const json & messa`
`201`	`201`	`msg.role = message.at("role");`
`202`	`202`
`203`	`203`	`auto has_content = message.contains("content");`
	`204`	`+ auto has_reasoning_content = message.contains("reasoning_content");`
`204`	`205`	`auto has_tool_calls = message.contains("tool_calls");`
`205`	`206`	`if (has_content) {`
`206`	`207`	`const auto & content = message.at("content");`
`@@ -249,8 +250,8 @@ std::vector<common_chat_msg> common_chat_msgs_parse_oaicompat(const json & messa`
`249`	`250`	`msg.tool_calls.push_back(tc);`
`250`	`251`	`}`
`251`	`252`	`}`
`252`		`- if (!has_content && !has_tool_calls) {`
`253`		`- throw std::runtime_error("Expected 'content' or 'tool_calls' (ref: https://github.com/ggml-org/llama.cpp/issues/8367 & https://github.com/ggml-org/llama.cpp/issues/12279)");`
	`253`	`+ if (!has_content && !has_tool_calls && !has_reasoning_content) {`
	`254`	`+ throw std::runtime_error("Expected 'content', 'reasoning_content' or 'tool_calls' (ref: https://github.com/ggml-org/llama.cpp/issues/8367 & https://github.com/ggml-org/llama.cpp/issues/12279)");`
`254`	`255`	`}`
`255`	`256`	`if (message.contains("reasoning_content")) {`
`256`	`257`	`msg.reasoning_content = message.at("reasoning_content");`
Original file line number	Diff line number	Diff line change
`@@ -595,8 +595,8 @@ static json oaicompat_chat_params_parse(`
`595`	`595`	`throw std::runtime_error("All non-assistant messages must contain 'content'");`
`596`	`596`	`}`
`597`	`597`	`if (role == "assistant") {`
`598`		`- if (!msg.contains("content") && !msg.contains("tool_calls")) {`
`599`		`- throw std::runtime_error("Assistant message must contain either 'content' or 'tool_calls'!");`
	`598`	`+ if (!msg.contains("content") && !msg.contains("tool_calls") && !msg.contains("reasoning_content")) {`
	`599`	`+ throw std::runtime_error("Assistant message must contain either 'content' or 'tool_calls' or 'reasoning_content'!");`
`600`	`600`	`}`
`601`	`601`	`if (!msg.contains("content")) {`
`602`	`602`	`continue; // avoid errors with no content`