@@ -231,6 +231,14 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
231231 )
232232
233233
234+ @modelgauge_sut (capabilities = [AcceptsTextPrompt , AcceptsChatPrompt ])
235+ class HuggingFaceChatCompletionServerlessThinkingSUT (ThinkingMixin , HuggingFaceChatCompletionServerlessSUT ):
236+ """
237+ A SUT that excludes the reasoning from model output.
238+ Reasoning must be separated from normal output with a </think> tag (like nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16)
239+ """
240+
241+
234242HF_SECRET = InjectSecret (HuggingFaceInferenceToken )
235243
236244SUTS .register (
@@ -268,7 +276,7 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
268276 None ,
269277 HF_SECRET ,
270278 )
271- # Special thinking SUT
279+ # Special thinking dedicated SUTs
272280SUTS .register (
273281 HuggingFaceChatCompletionDedicatedThinkingSUT ,
274282 "nvidia-nemotron-3-nano-30b-a-thinking-excluded-hf" ,
@@ -283,7 +291,14 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
283291 "PrimeIntellect/INTELLECT-3" ,
284292 HF_SECRET ,
285293)
286-
294+ # Special thinking serverless SUTs
295+ SUTS .register (
296+ HuggingFaceChatCompletionServerlessThinkingSUT ,
297+ "moonshotai/Kimi-K2.5-together-thinking-excluded-hf" ,
298+ "moonshotai/Kimi-K2.5" ,
299+ "together" ,
300+ HF_SECRET ,
301+ )
287302# Register serverless SUTs.
288303SUTS .register (
289304 HuggingFaceChatCompletionServerlessSUT ,
0 commit comments