Skip to content

Commit ac62a07

Browse files
authored
register kimi (#1483)
1 parent a50baaf commit ac62a07

File tree

1 file changed

+17
-2
lines changed

1 file changed

+17
-2
lines changed

src/modelgauge/suts/huggingface_chat_completion.py

Lines changed: 17 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -231,6 +231,14 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
231231
)
232232

233233

234+
@modelgauge_sut(capabilities=[AcceptsTextPrompt, AcceptsChatPrompt])
235+
class HuggingFaceChatCompletionServerlessThinkingSUT(ThinkingMixin, HuggingFaceChatCompletionServerlessSUT):
236+
"""
237+
A SUT that excludes the reasoning from model output.
238+
Reasoning must be separated from normal output with a </think> tag (like nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16)
239+
"""
240+
241+
234242
HF_SECRET = InjectSecret(HuggingFaceInferenceToken)
235243

236244
SUTS.register(
@@ -268,7 +276,7 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
268276
None,
269277
HF_SECRET,
270278
)
271-
# Special thinking SUT
279+
# Special thinking dedicated SUTs
272280
SUTS.register(
273281
HuggingFaceChatCompletionDedicatedThinkingSUT,
274282
"nvidia-nemotron-3-nano-30b-a-thinking-excluded-hf",
@@ -283,7 +291,14 @@ def translate_chat_prompt(self, prompt: ChatPrompt, options: ModelOptions) -> Hu
283291
"PrimeIntellect/INTELLECT-3",
284292
HF_SECRET,
285293
)
286-
294+
# Special thinking serverless SUTs
295+
SUTS.register(
296+
HuggingFaceChatCompletionServerlessThinkingSUT,
297+
"moonshotai/Kimi-K2.5-together-thinking-excluded-hf",
298+
"moonshotai/Kimi-K2.5",
299+
"together",
300+
HF_SECRET,
301+
)
287302
# Register serverless SUTs.
288303
SUTS.register(
289304
HuggingFaceChatCompletionServerlessSUT,

0 commit comments

Comments
 (0)