@@ -180,7 +180,11 @@ def validate_credentials(self, model: str, credentials: dict) -> None:
                 endpoint_url += "/"
 
             # prepare the payload for a simple ping to the model
-            data = {"model": credentials.get("endpoint_model_name", model), "max_tokens": 5}
+            if credentials.get("reasoning_thought_support") == "supported":
+                # models with reasoning thought support expect max_completion_tokens instead of max_tokens
+                data = {"model": credentials.get("endpoint_model_name", model), "max_completion_tokens": 5}
+            else:
+                data = {"model": credentials.get("endpoint_model_name", model), "max_tokens": 5}
 
             completion_type = LLMMode.value_of(credentials["mode"])
 
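The change above only swaps the token-limit key in the validation ping. A minimal standalone sketch of the same selection logic, for readers skimming the diff (the helper name `build_ping_payload` is hypothetical and not part of this PR):

```python
def build_ping_payload(model: str, credentials: dict) -> dict:
    """Build the small ping payload used to validate credentials (illustrative sketch)."""
    # OpenAI-style reasoning endpoints reject "max_tokens" and expect
    # "max_completion_tokens" instead, which is what the credential flag signals.
    token_key = (
        "max_completion_tokens"
        if credentials.get("reasoning_thought_support") == "supported"
        else "max_tokens"
    )
    return {"model": credentials.get("endpoint_model_name", model), token_key: 5}
```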
@@ -256,6 +260,14 @@ def get_customizable_model_schema(self, model: str, credentials: dict) -> AIMode
         """
         features = []
 
+        # models with reasoning thought support expect max_completion_tokens instead of max_tokens
+        if credentials.get("reasoning_thought_support") == "supported":
+            max_token_param_name = DefaultParameterName.MAX_COMPLETION_TOKENS.value
+            max_token_param_label = "Max Completion Tokens"
+        else:
+            max_token_param_name = DefaultParameterName.MAX_TOKENS.value
+            max_token_param_label = "Max Tokens"
+
         function_calling_type = credentials.get("function_calling_type", "no_call")
         if function_calling_type == "function_call":
             features.append(ModelFeature.TOOL_CALL)
@@ -338,8 +350,8 @@ def get_customizable_model_schema(self, model: str, credentials: dict) -> AIMode
                     max=2,
                 ),
                 ParameterRule(
-                    name=DefaultParameterName.MAX_TOKENS.value,
-                    label=I18nObject(en_US="Max Tokens", zh_Hans="最大标记"),
+                    name=max_token_param_name,
+                    label=I18nObject(en_US=max_token_param_label, zh_Hans="最大标记"),
                     help=I18nObject(
                         en_US="Maximum length of tokens for the model response.",
                         zh_Hans="模型回答的tokens的最大长度。",
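For context, a rough sketch of the validation request an OpenAI-compatible reasoning endpoint would receive once the flag is set; the URL, API key, and model name below are placeholders, not values from this PR:

```python
import requests

# Placeholder values for illustration only.
endpoint_url = "https://example.com/v1/"
headers = {"Content-Type": "application/json", "Authorization": "Bearer <api-key>"}

payload = {
    "model": "my-reasoning-model",
    "max_completion_tokens": 5,  # reasoning models use this instead of "max_tokens"
    "messages": [{"role": "user", "content": "ping"}],
}

response = requests.post(endpoint_url + "chat/completions", headers=headers, json=payload, timeout=10)
print(response.status_code)
```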