We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ba2704a, commit 820b353. Copy full SHA for 820b353.
tools/server/utils.hpp
@@ -749,6 +749,10 @@ static json oaicompat_completion_params_parse(
749
throw std::runtime_error("Cannot have 2 or more assistant messages at the end of the list.");
750
}
751
752
+ if(inputs.chat_template_kwargs.find("enable_thinking") != inputs.chat_template_kwargs.end()) {
753
+ throw std::runtime_error("Assistant response prefill is incompatible with enable_thinking.");
754
+ }
755
+
756
inputs.extract_reasoning = false;
757
inputs.add_generation_prompt = true;
758
0 commit comments