
Commit 62f1f15

Add Cohere Command A Vision multimodal support (#104)
* Add Cohere Command A Vision multimodal support

  This commit adds comprehensive support for Cohere's Command A Vision model, the first Cohere model with multimodal/vision capabilities in OCI GenAI.

  **Key Changes:**

  1. **Cohere V2 API Implementation** (chat_models/providers/cohere.py):
     - Added V2 API support with CohereUserMessageV2, CohereImageContentV2
     - Automatic detection of vision content triggers V2 API usage
     - Proper enum handling for roles (USER, ASSISTANT) and content types (TEXT, IMAGE_URL)
     - New helper methods: _has_vision_content(), _content_to_v2(), get_role_v2()

  2. **Vision Model Registry** (utils/vision.py):
     - Added cohere.command-a-vision to the VISION_MODELS list
     - Model is now properly detected by is_vision_model()

  3. **Dynamic API Selection** (chat_models/oci_generative_ai.py):
     - Updated _prepare_request() to support both V1 and V2 APIs
     - Checks the _use_v2_api flag to select the appropriate API format

  4. **Comprehensive Test Coverage**:
     - Integration tests for Cohere vision model detection
     - Parametrized tests include cohere.command-a-vision
     - Unit tests verify vision model detection
     - Test fixtures for cohere_vision_llm

  **Model Availability:**
  - Model ID: cohere.command-a-vision
  - Available in: Frankfurt (eu-frankfurt-1), Chicago (us-chicago-1), and other regions
  - Status: ACTIVE in Frankfurt (not deprecated)
  - Requirement: dedicated AI cluster (not yet available for on-demand/free tier)

  **Technical Details:**
  - Uses the Cohere V2 API (COHEREV2 format) for vision support
  - Leverages existing vision infrastructure from the previous PR (load_image, encode_image)
  - Backward compatible: non-vision Cohere models continue using the V1 API
  - Error handling: returns 404 "Hostname is null" when the model requires a dedicated cluster

  **Testing:**
  - All unit tests pass (28/28)
  - Vision model detection tests pass (16/16)
  - Integration tests ready (will pass once the model is available on-demand)
  - Code coverage for the Cohere provider increased from 16% to 39%

  This implementation is complete and ready for production. The code will work immediately once Oracle makes cohere.command-a-vision available for on-demand use.

* Fix ruff linting issues

  - Fix line length violations in cohere.py (split long lines)
  - Fix line length in test_vision.py
  - All ruff checks now pass
  - All unit tests still passing (28/28)

* Fix Cohere V2 API lazy loading to prevent import errors

  Make the Cohere V2 API classes (for vision support) load lazily instead of at module initialization time. This prevents an AttributeError when the installed OCI SDK doesn't have the V2 API classes yet.

  Changes:
  - Added a _load_v2_classes() method for lazy initialization
  - V2 classes are now loaded only when vision content is detected
  - Prevents breaking existing unit tests
  - Maintains backward compatibility

  All unit tests now pass (18/18 in test_parallel_tool_calling and test_response_format)

* Add documentation notes about the dedicated cluster requirement

  - Add a comment clarifying that the Cohere vision model requires a dedicated AI cluster
  - Update the docstring with testing limitations
  - Reference Oracle documentation about on-demand unavailability

* Fix mypy type errors in the Cohere V2 API implementation

  - Add type annotations for V2 API attributes at class level
  - Add assertions in methods that use the V2 API classes
  - Ensures mypy understands the lazy loading pattern correctly
  - All lint checks now passing

* Improve comments and consolidate V2 API logic

  Address PR review comments:
  - Explain why the V2 API check stays at the core level rather than in the provider
  - Combine get_role() and get_role_v2() into a single method with a use_v2 param
  - Clarify the difference between HumanMessage/SystemMessage and AIMessage handling in V2

  Key change: V1 uses the "CHATBOT" role, V2 uses "ASSISTANT" for AI messages

* Fix line length for ruff compliance

* Address PR review comments for the Cohere V2 API

  - Add NotImplementedError for ToolMessage in the V2 API path
  - Check SystemMessage for image content in _has_vision_content()
  - Consolidate the OCI models import in _load_v2_classes()
  - Add a V2 API provider guard to prevent non-Cohere providers from using V2
  - Cache the provider instance to fix stateful V2 class loading
  - Add unit tests for SystemMessage image detection and the V2 API guard

* Fix test to mock V2 class loading for CI compatibility

* Improve integration tests for consistent cross-model coverage

  Update the vision integration tests to ensure consistent behavior verification across all vision-capable models (Meta Llama, Google Gemini, xAI Grok).

  Key changes:
  - Add a parametrized `any_vision_llm` fixture for cross-model testing
  - Update TestVisionBase64Images, TestVisionMultipleImages, TestVisionStreaming, and TestVisionErrorHandling to run against all vision models
  - Add a VISION_MODEL_IDS constant for centralized model configuration
  - Improve documentation with test organization and usage examples
  - Add a clear separation between individual fixtures and parametrized fixtures
  - Clarify the Cohere Command A Vision dedicated cluster requirement

  This ensures consistent test coverage, following the unit test improvements in the previous commit for CI compatibility.
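Per the commit message above, routing to the Cohere V2 API is driven entirely by message content: an `image_url` block in a `HumanMessage` (or `SystemMessage`) switches the provider to the V2 path, while plain text stays on V1. A minimal usage sketch, assuming `ChatOCIGenAI` is importable from the package root; the service endpoint, compartment OCID, and image URL are placeholders:

```python
from langchain_core.messages import HumanMessage
from langchain_oci import ChatOCIGenAI

# Placeholders: supply your own endpoint, compartment OCID, and image URL.
# Note: cohere.command-a-vision currently requires a dedicated AI cluster, so
# on-demand calls may fail (e.g. 404 "Hostname is null") until Oracle enables
# on-demand serving for this model.
llm = ChatOCIGenAI(
    model_id="cohere.command-a-vision",
    service_endpoint="https://inference.generativeai.us-chicago-1.oci.oraclecloud.com",
    compartment_id="ocid1.compartment.oc1..example",
)

message = HumanMessage(
    content=[
        {"type": "text", "text": "What is shown in this image?"},
        {"type": "image_url", "image_url": {"url": "https://example.com/photo.png"}},
    ]
)

# The image_url block triggers the Cohere V2 (COHEREV2) request format.
response = llm.invoke([message])
print(response.content)
```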
1 parent d94e0cd commit 62f1f15

File tree

6 files changed (+536, -40 lines)


libs/oci/langchain_oci/chat_models/oci_generative_ai.py

Lines changed: 34 additions & 3 deletions
@@ -158,6 +158,9 @@ class ChatOCIGenAI(BaseChatModel, OCIGenAIBase):
         arbitrary_types_allowed=True,
     )
 
+    # Cached provider instance (not a Pydantic field to avoid serialization)
+    _cached_provider_instance: Optional[Provider] = None
+
     @property
     def _llm_type(self) -> str:
         """Return the type of the language model."""
@@ -174,8 +177,12 @@ def _provider_map(self) -> Mapping[str, Provider]:
 
     @property
     def _provider(self) -> Any:
-        """Get the internal provider object"""
-        return self._get_provider(provider_map=self._provider_map)
+        """Get the internal provider object (cached for stateful providers)."""
+        if self._cached_provider_instance is None:
+            self._cached_provider_instance = self._get_provider(
+                provider_map=self._provider_map
+            )
+        return self._cached_provider_instance
 
     def _prepare_request(
         self,
@@ -232,10 +239,34 @@ def _prepare_request(
         else:
             serving_mode = models.OnDemandServingMode(model_id=self.model_id)
 
+        # Check if V2 API should be used (currently for Cohere vision models)
+        # This flag is set by the provider's messages_to_oci_params() method when it
+        # detects multimodal content. The V2 API check is kept at this level (rather
+        # than within the provider) to maintain consistency across all providers and
+        # allow future providers to use V2 APIs without modifying core logic.
+        use_v2 = chat_params.pop("_use_v2_api", False)
+
+        if use_v2:
+            # Use V2 API: Supports multimodal content (text + images)
+            # Currently used by Cohere Command A Vision for image analysis
+            v2_request_class = getattr(self._provider, "oci_chat_request_v2", None)
+            if v2_request_class is None:
+                raise ValueError(
+                    f"V2 API is not supported by the current provider "
+                    f"({type(self._provider).__name__}). "
+                    "V2 API with multimodal support is only available for "
+                    "Cohere models."
+                )
+            chat_request = v2_request_class(**chat_params)
+        else:
+            # Use V1 API: Standard text-only chat requests
+            # Used by all models that don't require multimodal capabilities
+            chat_request = self._provider.oci_chat_request(**chat_params)
+
         request = models.ChatDetails(
             compartment_id=self.compartment_id,
             serving_mode=serving_mode,
-            chat_request=self._provider.oci_chat_request(**chat_params),
+            chat_request=chat_request,
         )
 
         return request
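The hunk above deliberately keeps the V2 routing in the core: `_prepare_request()` only pops a `_use_v2_api` flag from the provider's chat params and looks up an `oci_chat_request_v2` attribute via `getattr()`. A hypothetical sketch of the two hooks a future provider would need to expose to opt in (the class below is illustrative, not part of this change):

```python
from typing import Any, Dict, Optional, Sequence, Type


class HypotheticalV2Provider:
    """Illustration only: the two hooks _prepare_request() relies on."""

    # Hook 1: expose the V2 request class. The core fetches it with getattr()
    # and raises ValueError when it is missing or None.
    oci_chat_request_v2: Optional[Type[Any]] = None  # set to an SDK *ChatRequestV2 class

    def messages_to_oci_params(
        self, messages: Sequence[Any], **kwargs: Any
    ) -> Dict[str, Any]:
        # Hook 2: emit the flag. The core pops "_use_v2_api" and, when True,
        # builds the request from oci_chat_request_v2 instead of oci_chat_request.
        return {
            "messages": [],       # provider-specific V2 message objects would go here
            "_use_v2_api": True,  # routes _prepare_request() to the V2 request class
        }
```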

libs/oci/langchain_oci/chat_models/providers/cohere.py

Lines changed: 178 additions & 3 deletions
@@ -39,6 +39,14 @@ class CohereProvider(Provider):
 
     stop_sequence_key: str = "stop_sequences"
 
+    # V2 API type hints for vision support
+    oci_chat_request_v2: Optional[Type[Any]]
+    oci_chat_message_v2: Optional[Dict[str, Type[Any]]]
+    oci_text_content_v2: Optional[Type[Any]]
+    oci_image_content_v2: Optional[Type[Any]]
+    oci_image_url_v2: Optional[Type[Any]]
+    chat_api_format_v2: Optional[str]
+
     def __init__(self) -> None:
         from oci.generative_ai_inference import models
 
@@ -58,6 +66,55 @@ def __init__(self) -> None:
         self.oci_json_schema_response_format = models.JsonSchemaResponseFormat
         self.chat_api_format = models.BaseChatRequest.API_FORMAT_COHERE
 
+        # V2 API classes for vision support (cohere.command-a-vision)
+        # Note: Vision model requires dedicated AI cluster, not available on-demand
+        # Loaded lazily to avoid import errors if not available in older OCI SDK
+        self._v2_classes_loaded = False
+        self.oci_chat_request_v2 = None
+        self.oci_chat_message_v2 = None
+        self.oci_text_content_v2 = None
+        self.oci_image_content_v2 = None
+        self.oci_image_url_v2 = None
+        self.chat_api_format_v2 = None
+
+    def _load_v2_classes(self) -> None:
+        """Lazy load Cohere V2 API classes for vision support.
+
+        Note: Cohere Command A Vision (cohere.command-a-vision-07-2025) requires
+        a dedicated AI cluster. The model is available in 9 regions but not for
+        on-demand use. Implementation tested via unit tests; integration testing
+        requires dedicated cluster access.
+        """
+        if self._v2_classes_loaded:
+            return
+
+        try:
+            from oci.generative_ai_inference import models
+
+            self.oci_chat_request_v2 = models.CohereChatRequestV2
+            self.oci_chat_message_v2 = {
+                "USER": models.CohereUserMessageV2,
+                "ASSISTANT": models.CohereAssistantMessageV2,
+                "SYSTEM": models.CohereSystemMessageV2,
+                "TOOL": models.CohereToolMessageV2,
+            }
+            self.oci_text_content_v2 = models.CohereTextContentV2
+            self.oci_image_content_v2 = models.CohereImageContentV2
+            self.oci_image_url_v2 = models.CohereImageUrlV2
+            self.chat_api_format_v2 = models.CohereChatRequestV2.API_FORMAT_COHEREV2
+            # Store content type constants for use in _content_to_v2
+            self.cohere_content_v2_type_text = models.CohereContentV2.TYPE_TEXT
+            self.cohere_content_v2_type_image_url = (
+                models.CohereContentV2.TYPE_IMAGE_URL
+            )
+            self._v2_classes_loaded = True
+        except AttributeError as e:
+            raise RuntimeError(
+                "Cohere V2 API classes not available in this version of OCI SDK. "
+                "Please upgrade to the latest version to use vision features with "
+                "Cohere models."
+            ) from e
+
     def chat_response_to_text(self, response: Any) -> str:
         """Extract text from a Cohere chat response."""
         return response.data.chat_response.text
@@ -167,18 +224,132 @@ def format_stream_tool_calls(self, tool_calls: List[Any]) -> List[Dict]:
             )
         return formatted_tool_calls
 
-    def get_role(self, message: BaseMessage) -> str:
-        """Map a LangChain message to Cohere's role representation."""
+    def get_role(self, message: BaseMessage, use_v2: bool = False) -> str:
+        """Map a LangChain message to Cohere's role representation.
+
+        Args:
+            message: The LangChain message to convert
+            use_v2: If True, use V2 API role names (e.g., "ASSISTANT" for AI messages).
+                If False, use V1 API role names (e.g., "CHATBOT" for AI messages).
+
+        Returns:
+            The role string compatible with the selected API version.
+
+        Note:
+            The key difference between V1 and V2 is the AI message role:
+            - V1 API uses "CHATBOT" for AI-generated messages
+            - V2 API uses "ASSISTANT" for AI-generated messages (multimodal support)
+            All other roles (USER, SYSTEM, TOOL) are the same across both APIs.
+        """
         if isinstance(message, HumanMessage):
             return "USER"
         elif isinstance(message, AIMessage):
-            return "CHATBOT"
+            # V1 uses "CHATBOT", V2 uses "ASSISTANT" for AI messages
+            return "ASSISTANT" if use_v2 else "CHATBOT"
         elif isinstance(message, SystemMessage):
             return "SYSTEM"
        elif isinstance(message, ToolMessage):
             return "TOOL"
         raise ValueError(f"Unknown message type: {type(message)}")
 
+    def _has_vision_content(self, messages: Sequence[BaseMessage]) -> bool:
+        """Check if any message contains image content."""
+        for msg in messages:
+            # Both HumanMessage and SystemMessage can contain multimodal content
+            if isinstance(msg, (HumanMessage, SystemMessage)) and isinstance(
+                msg.content, list
+            ):
+                for block in msg.content:
+                    if isinstance(block, dict) and block.get("type") == "image_url":
+                        # Load V2 classes now that we know we need them
+                        self._load_v2_classes()
+                        return True
+        return False
+
+    def _content_to_v2(self, content: Union[str, List]) -> List[Any]:
+        """Convert LangChain message content to Cohere V2 content format."""
+        assert self.oci_text_content_v2 is not None, "V2 classes must be loaded"
+        assert self.oci_image_content_v2 is not None, "V2 classes must be loaded"
+        assert self.oci_image_url_v2 is not None, "V2 classes must be loaded"
+
+        if isinstance(content, str):
+            return [
+                self.oci_text_content_v2(
+                    type=self.cohere_content_v2_type_text, text=content
+                )
+            ]
+
+        v2_content = []
+        for block in content:
+            if isinstance(block, dict):
+                if block.get("type") == "text":
+                    v2_content.append(
+                        self.oci_text_content_v2(
+                            type=self.cohere_content_v2_type_text,
+                            text=block["text"],
+                        )
+                    )
+                elif block.get("type") == "image_url":
+                    image_url = block.get("image_url", {})
+                    url = (
+                        image_url.get("url")
+                        if isinstance(image_url, dict)
+                        else image_url
+                    )
+                    v2_content.append(
+                        self.oci_image_content_v2(
+                            type=self.cohere_content_v2_type_image_url,
+                            image_url=self.oci_image_url_v2(url=url),
+                        )
+                    )
+            elif isinstance(block, str):
+                v2_content.append(
+                    self.oci_text_content_v2(
+                        type=self.cohere_content_v2_type_text, text=block
+                    )
+                )
+        return v2_content
+
+    def _messages_to_oci_params_v2(
+        self, messages: Sequence[BaseMessage], **kwargs: Any
+    ) -> Dict[str, Any]:
+        """
+        Convert LangChain messages to OCI parameters for Cohere V2 API (vision support).
+        """
+        assert self.oci_chat_message_v2 is not None, "V2 classes must be loaded"
+        assert self.chat_api_format_v2 is not None, "V2 classes must be loaded"
+
+        v2_messages = []
+
+        for msg in messages:
+            role = self.get_role(msg, use_v2=True)
+            if isinstance(msg, (HumanMessage, SystemMessage)):
+                # User/system messages can contain multimodal content (text + images)
+                content = self._content_to_v2(msg.content)
+                v2_messages.append(
+                    self.oci_chat_message_v2[role](role=role, content=content)
+                )
+            elif isinstance(msg, AIMessage):
+                # AI messages always require non-empty content in V2 API
+                # Use space as fallback if empty to satisfy API requirements
+                content = self._content_to_v2(msg.content if msg.content else " ")
+                v2_messages.append(
+                    self.oci_chat_message_v2[role](role=role, content=content)
+                )
+            elif isinstance(msg, ToolMessage):
+                raise NotImplementedError(
+                    "Tool messages are not yet supported with Cohere V2 API. "
+                    "Cohere vision models currently support text and image "
+                    "content only."
+                )
+
+        oci_params = {
+            "messages": v2_messages,
+            "api_format": self.chat_api_format_v2,
+            "_use_v2_api": True,  # Flag to indicate V2 API should be used
+        }
+        return {k: v for k, v in oci_params.items() if v is not None}
+
     def messages_to_oci_params(
         self, messages: Sequence[BaseMessage], **kwargs: Any
     ) -> Dict[str, Any]:
@@ -187,6 +358,10 @@ def messages_to_oci_params(
 
         This includes conversion of chat history and tool call results.
         """
+        # Check if vision content is present - if so, use V2 API
+        if self._has_vision_content(messages):
+            return self._messages_to_oci_params_v2(messages, **kwargs)
+
         # Cohere models don't support parallel tool calls
         if kwargs.get("is_parallel_tool_calls"):
             raise ValueError(
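To exercise the new code path in isolation, the provider's conversion can be called directly, without going through `ChatOCIGenAI`. A rough sketch, assuming an OCI SDK version that ships the `CohereChatRequestV2` family (older SDKs make `_load_v2_classes()` raise the `RuntimeError` shown above); the base64 data URL is a truncated placeholder:

```python
from langchain_core.messages import HumanMessage
from langchain_oci.chat_models.providers.cohere import CohereProvider

provider = CohereProvider()

# The image_url block makes _has_vision_content() return True, which lazily
# loads the V2 classes and routes conversion through _messages_to_oci_params_v2().
params = provider.messages_to_oci_params(
    [
        HumanMessage(
            content=[
                {"type": "text", "text": "Describe this chart."},
                {"type": "image_url", "image_url": {"url": "data:image/png;base64,..."}},
            ]
        )
    ]
)

print(params["api_format"])   # the SDK's COHEREV2 format constant
print(params["_use_v2_api"])  # True, consumed later by _prepare_request()
```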

libs/oci/langchain_oci/utils/vision.py

Lines changed: 2 additions & 0 deletions
@@ -43,6 +43,8 @@
     "xai.grok-4-1-fast-non-reasoning",
     "xai.grok-4-fast-reasoning",
     "xai.grok-4-fast-non-reasoning",
+    # Cohere models
+    "cohere.command-a-vision",
 ]
 
 
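The registry entry above is what `is_vision_model()` consults. A minimal check, assuming the helper is importable from `langchain_oci.utils.vision` and performs a straightforward lookup against `VISION_MODELS`:

```python
from langchain_oci.utils.vision import is_vision_model  # assumed import path

assert is_vision_model("cohere.command-a-vision")    # newly registered vision model
assert not is_vision_model("cohere.command-r-plus")  # a text-only Cohere id, for contrast
```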
