langchain-ai
diff --git a/libs/ibm/langchain_ibm/chat_models.py b/libs/ibm/langchain_ibm/chat_models.py
Lines changed: 116 additions & 44 deletions
diff --git a/libs/ibm/poetry.lock b/libs/ibm/poetry.lock
Lines changed: 24 additions & 14 deletions
diff --git a/libs/ibm/pyproject.toml b/libs/ibm/pyproject.toml
Lines changed: 2 additions & 2 deletions
diff --git a/libs/ibm/tests/integration_tests/test_chat_models.py b/libs/ibm/tests/integration_tests/test_chat_models.py
Lines changed: 2 additions & 1 deletion
@@ -28,6 +28,7 @@
     BaseSchema,
     TextChatParameters,
 )
+from ibm_watsonx_ai.gateway import Gateway  # type: ignore
 from langchain_core.callbacks import (
     AsyncCallbackManagerForLLMRun,
     CallbackManagerForLLMRun,
@@ -428,6 +429,9 @@ class ChatWatsonx(BaseChatModel):
     model_id: Optional[str] = None
     """Type of model to use."""
 
+    model: Optional[str] = None
+    """Name of model for given provider or alias."""
+
     deployment_id: Optional[str] = None
     """Type of deployed model to use."""
 
@@ -558,6 +562,10 @@ class ChatWatsonx(BaseChatModel):
 
     watsonx_model: ModelInference = Field(default=None, exclude=True)  #: :meta private:
 
+    watsonx_model_gateway: Gateway = Field(
+        default=None, exclude=True
+    )  #: :meta private:
+
     watsonx_client: Optional[APIClient] = Field(default=None, exclude=True)
 
     model_config = ConfigDict(populate_by_name=True)
@@ -624,21 +632,58 @@ def validate_environment(self) -> Self:
                 if v is not None
             }
         )
+        if self.watsonx_model_gateway is not None:
+            raise NotImplementedError(
+                "Passing the 'watsonx_model_gateway' parameter to the ChatWatsonx "
+                "constructor is not supported yet."
+            )
 
-        if isinstance(self.watsonx_client, APIClient):
-            watsonx_model = ModelInference(
-                model_id=self.model_id,
-                deployment_id=self.deployment_id,
-                params=self.params,
-                api_client=self.watsonx_client,
-                project_id=self.project_id,
-                space_id=self.space_id,
-                verify=self.verify,
-                validate=self.validate_model,
+        if isinstance(self.watsonx_model, ModelInference):
+            self.model_id = getattr(self.watsonx_model, "model_id")
+            self.deployment_id = getattr(self.watsonx_model, "deployment_id", "")
+            self.project_id = getattr(
+                getattr(self.watsonx_model, "_client"),
+                "default_project_id",
+            )
+            self.space_id = getattr(
+                getattr(self.watsonx_model, "_client"), "default_space_id"
             )
-            self.watsonx_model = watsonx_model
+            self.params = getattr(self.watsonx_model, "params")
+            self.watsonx_client = getattr(self.watsonx_model, "_client")
 
+        elif isinstance(self.watsonx_client, APIClient):
+            if sum(map(bool, (self.model, self.model_id, self.deployment_id))) != 1:
+                raise ValueError(
+                    "The parameters 'model', 'model_id' and 'deployment_id' are "
+                    "mutually exclusive. Please specify exactly one of these "
+                    "parameters when initializing ChatWatsonx."
+                )
+            if self.model is not None:
+                watsonx_model_gateway = Gateway(
+                    api_client=self.watsonx_client,
+                    verify=self.verify,
+                )
+                self.watsonx_model_gateway = watsonx_model_gateway
+            else:
+                watsonx_model = ModelInference(
+                    model_id=self.model_id,
+                    deployment_id=self.deployment_id,
+                    params=self.params,
+                    api_client=self.watsonx_client,
+                    project_id=self.project_id,
+                    space_id=self.space_id,
+                    verify=self.verify,
+                    validate=self.validate_model,
+                )
+                self.watsonx_model = watsonx_model
         else:
+            if sum(map(bool, (self.model, self.model_id, self.deployment_id))) != 1:
+                raise ValueError(
+                    "The parameters 'model', 'model_id' and 'deployment_id' are "
+                    "mutually exclusive. Please specify exactly one of these "
+                    "parameters when initializing ChatWatsonx."
+                )
+
             check_for_attribute(self.url, "url", "WATSONX_URL")
 
             if "cloud.ibm.com" in self.url.get_secret_value():
@@ -687,18 +732,24 @@ def validate_environment(self) -> Self:
                 version=self.version.get_secret_value() if self.version else None,
                 verify=self.verify,
             )
-
-            watsonx_chat = ModelInference(
-                model_id=self.model_id,
-                deployment_id=self.deployment_id,
-                credentials=credentials,
-                params=self.params,
-                project_id=self.project_id,
-                space_id=self.space_id,
-                verify=self.verify,
-                validate=self.validate_model,
-            )
-            self.watsonx_model = watsonx_chat
+            if self.model is not None:
+                watsonx_model_gateway = Gateway(
+                    credentials=credentials,
+                    verify=self.verify,
+                )
+                self.watsonx_model_gateway = watsonx_model_gateway
+            else:
+                watsonx_model = ModelInference(
+                    model_id=self.model_id,
+                    deployment_id=self.deployment_id,
+                    credentials=credentials,
+                    params=self.params,
+                    project_id=self.project_id,
+                    space_id=self.space_id,
+                    verify=self.verify,
+                    validate=self.validate_model,
+                )
+                self.watsonx_model = watsonx_model
 
         return self
 
@@ -717,10 +768,14 @@ def _generate(
 
         message_dicts, params = self._create_message_dicts(messages, stop, **kwargs)
         updated_params = self._merge_params(params, kwargs)
-
-        response = self.watsonx_model.chat(
-            messages=message_dicts, **(kwargs | {"params": updated_params})
-        )
+        if self.watsonx_model_gateway is not None:
+            response = self.watsonx_model_gateway.chat.completions.create(
+                model=self.model, messages=message_dicts, **(kwargs | updated_params)
+            )
+        else:
+            response = self.watsonx_model.chat(
+                messages=message_dicts, **(kwargs | {"params": updated_params})
+            )
         return self._create_chat_result(response)
 
     async def _agenerate(
@@ -738,10 +793,14 @@ async def _agenerate(
 
         message_dicts, params = self._create_message_dicts(messages, stop, **kwargs)
         updated_params = self._merge_params(params, kwargs)
-
-        response = await self.watsonx_model.achat(
-            messages=message_dicts, **(kwargs | {"params": updated_params})
-        )
+        if self.watsonx_model_gateway is not None:
+            response = await self.watsonx_model_gateway.chat.completions.acreate(
+                model=self.model, messages=message_dicts, **(kwargs | updated_params)
+            )
+        else:
+            response = await self.watsonx_model.achat(
+                messages=message_dicts, **(kwargs | {"params": updated_params})
+            )
         return self._create_chat_result(response)
 
     def _stream(
@@ -754,16 +813,23 @@ def _stream(
         message_dicts, params = self._create_message_dicts(messages, stop, **kwargs)
         updated_params = self._merge_params(params, kwargs)
 
-        default_chunk_class: Type[BaseMessageChunk] = AIMessageChunk
+        if self.watsonx_model_gateway is not None:
+            call_kwargs = {**kwargs, **updated_params, "stream": True}
+            chunk_iter = self.watsonx_model_gateway.chat.completions.create(
+                model=self.model, messages=message_dicts, **call_kwargs
+            )
+        else:
+            call_kwargs = {**kwargs, "params": updated_params}
+            chunk_iter = self.watsonx_model.chat_stream(
+                messages=message_dicts, **call_kwargs
+            )
 
+        default_chunk_class: Type[BaseMessageChunk] = AIMessageChunk
         is_first_tool_chunk = True
         _prompt_tokens_included = False
 
-        for chunk in self.watsonx_model.chat_stream(
-            messages=message_dicts, **(kwargs | {"params": updated_params})
-        ):
-            if not isinstance(chunk, dict):
-                chunk = chunk.model_dump()
+        for chunk in chunk_iter:
+            chunk = chunk if isinstance(chunk, dict) else chunk.model_dump()
             generation_chunk = _convert_chunk_to_generation_chunk(
                 chunk, default_chunk_class, is_first_tool_chunk, _prompt_tokens_included
             )
@@ -804,17 +870,23 @@ async def _astream(
         message_dicts, params = self._create_message_dicts(messages, stop, **kwargs)
         updated_params = self._merge_params(params, kwargs)
 
-        default_chunk_class: Type[BaseMessageChunk] = AIMessageChunk
+        if self.watsonx_model_gateway is not None:
+            call_kwargs = {**kwargs, **updated_params, "stream": True}
+            chunk_iter = await self.watsonx_model_gateway.chat.completions.acreate(
+                model=self.model, messages=message_dicts, **call_kwargs
+            )
+        else:
+            call_kwargs = {**kwargs, "params": updated_params}
+            chunk_iter = await self.watsonx_model.achat_stream(
+                messages=message_dicts, **call_kwargs
+            )
 
+        default_chunk_class: Type[BaseMessageChunk] = AIMessageChunk
         is_first_tool_chunk = True
         _prompt_tokens_included = False
 
-        response = await self.watsonx_model.achat_stream(
-            messages=message_dicts, **(kwargs | {"params": updated_params})
-        )
-        async for chunk in response:
-            if not isinstance(chunk, dict):
-                chunk = chunk.model_dump()
+        async for chunk in chunk_iter:
+            chunk = chunk if isinstance(chunk, dict) else chunk.model_dump()
             generation_chunk = _convert_chunk_to_generation_chunk(
                 chunk,
                 default_chunk_class,
 
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "langchain-ibm"
-version = "0.3.13"
+version = "0.3.14"
 description = "An integration package connecting IBM watsonx.ai and LangChain"
 authors = ["IBM"]
 readme = "README.md"
@@ -13,7 +13,7 @@ license = "MIT"
 [tool.poetry.dependencies]
 python = ">=3.10,<3.14"
 langchain-core = "^0.3.39"
-ibm-watsonx-ai = "^1.3.18"
+ibm-watsonx-ai = "^1.3.28"
 
 [tool.poetry.group.test]
 optional = true
 
@@ -26,6 +26,7 @@
 
 MODEL_ID = "ibm/granite-34b-code-instruct"
 MODEL_ID_TOOL = "mistralai/mistral-large"
+MODEL_ID_TOOL_2 = "meta-llama/llama-3-3-70b-instruct"
 
 PARAMS_WITH_MAX_TOKENS = {"max_tokens": 20}
 
@@ -484,7 +485,7 @@ class Person(BaseModel):
 def test_chat_bind_tools_list_tool_choice_dict() -> None:
     """Test that tool choice is respected just passing in True."""
     chat = ChatWatsonx(
-        model_id=MODEL_ID_TOOL,
+        model_id=MODEL_ID_TOOL_2,
         url=URL,  # type: ignore[arg-type]
         project_id=WX_PROJECT_ID,
         params={"temperature": 0},