oracle
diff --git a/‎libs/oci/langchain_oci/__init__.py‎
Lines changed: 15 additions & 1 deletion b/‎libs/oci/langchain_oci/__init__.py‎
Lines changed: 15 additions & 1 deletion
diff --git a/‎libs/oci/langchain_oci/chat_models/__init__.py‎
Lines changed: 7 additions & 3 deletions b/‎libs/oci/langchain_oci/chat_models/__init__.py‎
Lines changed: 7 additions & 3 deletions
diff --git a/‎libs/oci/langchain_oci/chat_models/oci_data_science.py‎
Lines changed: 39 additions & 6 deletions b/‎libs/oci/langchain_oci/chat_models/oci_data_science.py‎
Lines changed: 39 additions & 6 deletions
diff --git a/‎libs/oci/langchain_oci/embeddings/__init__.py‎
Lines changed: 3 additions & 2 deletions b/‎libs/oci/langchain_oci/embeddings/__init__.py‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎libs/oci/langchain_oci/embeddings/oci_data_science_model_deployment_endpoint.py‎
Lines changed: 205 additions & 0 deletions b/‎libs/oci/langchain_oci/embeddings/oci_data_science_model_deployment_endpoint.py‎
Lines changed: 205 additions & 0 deletions
diff --git a/‎libs/oci/langchain_oci/llms/__init__.py‎
Lines changed: 5 additions & 1 deletion b/‎libs/oci/langchain_oci/llms/__init__.py‎
Lines changed: 5 additions & 1 deletion
@@ -1,19 +1,33 @@
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2025 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
 from langchain_oci.chat_models.oci_generative_ai import ChatOCIGenAI
+from langchain_oci.chat_models.oci_data_science import (
+    ChatOCIModelDeployment,
+    ChatOCIModelDeploymentTGI,
+    ChatOCIModelDeploymentVLLM
+)
 from langchain_oci.embeddings.oci_generative_ai import OCIGenAIEmbeddings
+from langchain_oci.embeddings.oci_data_science_model_deployment_endpoint import OCIModelDeploymentEndpointEmbeddings
 from langchain_oci.llms.oci_data_science_model_deployment_endpoint import (
     BaseOCIModelDeployment,
     OCIModelDeploymentLLM,
+    OCIModelDeploymentTGI,
+    OCIModelDeploymentVLLM,
 )
 from langchain_oci.llms.oci_generative_ai import OCIGenAI, OCIGenAIBase
 
 __all__ = [
     "ChatOCIGenAI",
+    "ChatOCIModelDeployment",
+    "ChatOCIModelDeploymentTGI",
+    "ChatOCIModelDeploymentVLLM",
     "OCIGenAIEmbeddings",
+    "OCIModelDeploymentEndpointEmbeddings",
     "OCIGenAIBase",
     "OCIGenAI",
     "BaseOCIModelDeployment",
     "OCIModelDeploymentLLM",
+    "OCIModelDeploymentTGI",
+    "OCIModelDeploymentVLLM",
 ]
@@ -1,7 +1,11 @@
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2025 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
-from langchain_oci.chat_models.oci_data_science import ChatOCIModelDeployment
+from langchain_oci.chat_models.oci_data_science import (
+    ChatOCIModelDeployment,
+    ChatOCIModelDeploymentTGI,
+    ChatOCIModelDeploymentVLLM
+)
 from langchain_oci.chat_models.oci_generative_ai import ChatOCIGenAI
 
-__all__ = ["ChatOCIGenAI", "ChatOCIModelDeployment"]
+__all__ = ["ChatOCIGenAI", "ChatOCIModelDeployment", "ChatOCIModelDeploymentTGI", "ChatOCIModelDeploymentVLLM"]
@@ -1,4 +1,4 @@
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2025 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
 """Chat model for OCI data science model deployment endpoint."""
@@ -48,6 +48,7 @@
 )
 
 logger = logging.getLogger(__name__)
+# Value sent in the "route" request header by ChatOCIModelDeployment._headers.
+DEFAULT_INFERENCE_ENDPOINT_CHAT = "/v1/chat/completions"
 
 
 def _is_pydantic_class(obj: Any) -> bool:
@@ -57,6 +58,13 @@ def _is_pydantic_class(obj: Any) -> bool:
 class ChatOCIModelDeployment(BaseChatModel, BaseOCIModelDeployment):
     """OCI Data Science Model Deployment chat model integration.
 
+    Prerequisite:
+        The OCI Model Deployment plugins can be installed only on
+        Python 3.9 and above. If you are working inside a notebook,
+        try installing the Python 3.10 based conda pack and then running
+        the following setup.
+
+
     Setup:
         Install ``oracle-ads`` and ``langchain-openai``.
 
@@ -91,22 +99,28 @@ class ChatOCIModelDeployment(BaseChatModel, BaseOCIModelDeployment):
     Key init args — client params:
         auth: dict
             ADS auth dictionary for OCI authentication.
+        default_headers: Optional[Dict]
+            The headers to be added to the Model Deployment request.
 
     Instantiate:
         .. code-block:: python
 
-            from langchain_community.chat_models import ChatOCIModelDeployment
+            from langchain_oci.chat_models import ChatOCIModelDeployment
 
             chat = ChatOCIModelDeployment(
                 endpoint="https://modeldeployment.<region>.oci.customer-oci.com/<ocid>/predict",
-                model="odsc-llm",
+                model="odsc-llm", # this is the default model name if deployed with AQUA
                 streaming=True,
                 max_retries=3,
                 model_kwargs={
                     "max_token": 512,
                     "temperature": 0.2,
                     # other model parameters ...
                 },
+                default_headers={
+                    "route": "/v1/chat/completions",
+                    # other request headers ...
+                },
             )
 
     Invocation:
@@ -289,6 +303,25 @@ def _default_params(self) -> Dict[str, Any]:
             "stream": self.streaming,
         }
 
+    def _headers(
+        self, is_async: Optional[bool] = False, body: Optional[dict] = None
+    ) -> Dict:
+        """Build the request headers, defaulting the ``route`` header.
+
+        The parent implementation's headers are merged on top of the default
+        ``route`` entry, so a ``route`` key returned by the parent takes
+        precedence over ``DEFAULT_INFERENCE_ENDPOINT_CHAT``.
+
+        Args:
+            is_async (bool, optional): Forwarded unchanged to the parent
+                ``_headers``. Defaults to `False`.
+            body (optional): Forwarded unchanged to the parent ``_headers``.
+
+        Returns:
+            Dict: The parent's headers plus a ``route`` entry when the parent
+            did not provide one.
+        """
+        parent_headers = super()._headers(is_async=is_async, body=body)
+        merged = {"route": DEFAULT_INFERENCE_ENDPOINT_CHAT}
+        merged.update(parent_headers)
+        return merged
+
+
     def _generate(
         self,
         messages: List[BaseMessage],
@@ -702,7 +735,7 @@ def _process_response(self, response_json: dict) -> ChatResult:
 
         for choice in choices:
             message = _convert_dict_to_message(choice["message"])
-            generation_info = dict(finish_reason=choice.get("finish_reason"))
+            generation_info = {"finish_reason": choice.get("finish_reason")}
             if "logprobs" in choice:
                 generation_info["logprobs"] = choice["logprobs"]
 
@@ -746,7 +779,7 @@ class ChatOCIModelDeploymentVLLM(ChatOCIModelDeployment):
 
         .. code-block:: python
 
-            from langchain_community.chat_models import ChatOCIModelDeploymentVLLM
+            from langchain_oci.chat_models import ChatOCIModelDeploymentVLLM
 
             chat = ChatOCIModelDeploymentVLLM(
                 endpoint="https://modeldeployment.us-ashburn-1.oci.customer-oci.com/<ocid>/predict",
@@ -913,7 +946,7 @@ class ChatOCIModelDeploymentTGI(ChatOCIModelDeployment):
 
         .. code-block:: python
 
-            from langchain_community.chat_models import ChatOCIModelDeploymentTGI
+            from langchain_oci.chat_models import ChatOCIModelDeploymentTGI
 
             chat = ChatOCIModelDeploymentTGI(
                 endpoint="https://modeldeployment.us-ashburn-1.oci.customer-oci.com/<ocid>/predict",
 
@@ -1,6 +1,7 @@
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2025 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
+from langchain_oci.embeddings.oci_data_science_model_deployment_endpoint import OCIModelDeploymentEndpointEmbeddings
 from langchain_oci.embeddings.oci_generative_ai import OCIGenAIEmbeddings
 
-__all__ = ["OCIGenAIEmbeddings"]
+__all__ = ["OCIModelDeploymentEndpointEmbeddings", "OCIGenAIEmbeddings"]
@@ -0,0 +1,205 @@
+# Copyright (c) 2025 Oracle and/or its affiliates.
+# Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
+
+from langchain_core.embeddings import Embeddings
+from langchain_core.language_models.llms import create_base_retry_decorator
+from langchain_core.utils import get_from_dict_or_env
+from pydantic import BaseModel, Field, model_validator
+import requests
+from typing import Any, Callable, Dict, List, Mapping, Optional
+
+
+# Headers used for a request when `endpoint_kwargs` does not contain "headers".
+DEFAULT_HEADER = {
+    "Content-Type": "application/json",
+}
+
+
+class TokenExpiredError(Exception):
+    """Raised after a 401 response once the signer has been refreshed.
+
+    It is one of the error types the retry decorator retries on.
+    """
+
+
+def _create_retry_decorator(llm) -> Callable[[Any], Any]:
+    """Build a retry decorator bounded by ``llm.max_retries``.
+
+    Only connection timeouts and ``TokenExpiredError`` are treated as
+    retryable.
+    """
+    retryable_errors = [requests.exceptions.ConnectTimeout, TokenExpiredError]
+    return create_base_retry_decorator(
+        error_types=retryable_errors,
+        max_retries=llm.max_retries,
+    )
+
+
+class OCIModelDeploymentEndpointEmbeddings(BaseModel, Embeddings):
+    """Embedding model deployed on OCI Data Science Model Deployment.
+
+    Texts are sent with ``requests.post`` to ``endpoint`` as
+    ``{"input": [<text>, ...]}`` and the request is signed with the
+    ``signer`` entry of ``auth``.
+
+    Example:
+
+        .. code-block:: python
+
+            from langchain_oci.embeddings import OCIModelDeploymentEndpointEmbeddings
+
+            embeddings = OCIModelDeploymentEndpointEmbeddings(
+                endpoint="https://modeldeployment.us-ashburn-1.oci.customer-oci.com/<md_ocid>/predict",
+            )
+    """  # noqa: E501
+
+    auth: dict = Field(default_factory=dict, exclude=True)
+    """ADS auth dictionary for OCI authentication:
+    https://accelerated-data-science.readthedocs.io/en/latest/user_guide/cli/authentication.html.
+    This can be generated by calling `ads.common.auth.api_keys()`
+    or `ads.common.auth.resource_principal()`. If this is not
+    provided then the `ads.common.default_signer()` will be used."""
+
+    endpoint: str = ""
+    """The uri of the endpoint from the deployed Model Deployment model."""
+
+    model_kwargs: Optional[Dict] = None
+    """Keyword arguments to pass to the model."""
+
+    endpoint_kwargs: Optional[Dict] = None
+    """Optional attributes passed to the `requests.post` function.
+    A "headers" entry, when present, replaces the default headers.
+    """
+
+    max_retries: int = 1
+    """The maximum number of retries to make when generating."""
+
+    @model_validator(mode="before")
+    @classmethod
+    def validate_environment(cls, values: Dict) -> Dict:
+        """Validate the environment and fill in default ``auth``/``endpoint``.
+
+        Args:
+            values: The raw init values.
+
+        Returns:
+            The same mapping with ``auth`` defaulted to the ADS default signer
+            and ``endpoint`` resolved from the values or the
+            ``OCI_LLM_ENDPOINT`` environment variable.
+
+        Raises:
+            ImportError: If the ``ads`` package cannot be imported.
+        """
+        try:
+            import ads
+
+        except ImportError as ex:
+            raise ImportError(
+                "Could not import ads python package. "
+                "Please install it with `pip install oracle_ads`."
+            ) from ex
+        if not values.get("auth", None):
+            values["auth"] = ads.common.auth.default_signer()
+        values["endpoint"] = get_from_dict_or_env(
+            values,
+            "endpoint",
+            "OCI_LLM_ENDPOINT",
+        )
+        return values
+
+    @property
+    def _identifying_params(self) -> Mapping[str, Any]:
+        """Get the identifying parameters (endpoint and model kwargs)."""
+        return {
+            "endpoint": self.endpoint,
+            "model_kwargs": self.model_kwargs or {},
+        }
+
+    def _refresh_signer(self) -> bool:
+        """Refresh the signer's security token when the signer supports it.
+
+        Returns:
+            True if ``auth["signer"]`` exposes a callable
+            ``refresh_security_token`` and it was invoked; False otherwise.
+        """
+        signer = self.auth.get("signer")
+        refresh = getattr(signer, "refresh_security_token", None)
+        if not callable(refresh):
+            return False
+        refresh()
+        return True
+
+    def _embed_with_retry(self, **kwargs) -> Any:
+        """POST to the endpoint, retrying on retryable failures.
+
+        Args:
+            **kwargs: Keyword arguments forwarded to ``requests.post``.
+
+        Returns:
+            The successful ``requests.Response``.
+
+        Raises:
+            TokenExpiredError: If the endpoint keeps answering 401 after the
+                signer was refreshed and the retries are used up.
+            ValueError: For any other failure, including a connection timeout
+                that persists after the retries are used up.
+        """
+        retry_decorator = _create_retry_decorator(self)
+
+        @retry_decorator
+        def _completion_with_retry(**kwargs: Any) -> Any:
+            try:
+                response = requests.post(self.endpoint, **kwargs)
+                response.raise_for_status()
+                return response
+            except requests.exceptions.HTTPError as http_err:
+                if response.status_code == 401 and self._refresh_signer():
+                    raise TokenExpiredError() from http_err
+                raise ValueError(
+                    f"Server error: {str(http_err)}. Message: {response.text}"
+                ) from http_err
+            except requests.exceptions.ConnectTimeout:
+                # Let the timeout reach the retry decorator unwrapped;
+                # converting it to ValueError here would make it non-retryable.
+                raise
+            except Exception as e:
+                raise ValueError(f"Error occurs by inference endpoint: {str(e)}") from e
+
+        try:
+            return _completion_with_retry(**kwargs)
+        except requests.exceptions.ConnectTimeout as e:
+            # Retries are used up: report the timeout as the same ValueError
+            # callers received before timeouts were retried.
+            raise ValueError(f"Error occurs by inference endpoint: {str(e)}") from e
+
+    def _embedding(self, texts: List[str]) -> List[List[float]]:
+        """Call out to OCI Data Science Model Deployment Endpoint.
+
+        Args:
+            texts: A list of texts to embed.
+
+        Returns:
+            A list of list of floats representing the embeddings.
+
+        Raises:
+            ValueError: If the request fails or the response cannot be parsed.
+        """
+        _model_kwargs = self.model_kwargs or {}
+        body = self._construct_request_body(texts, _model_kwargs)
+        request_kwargs = self._construct_request_kwargs(body)
+        response = self._embed_with_retry(**request_kwargs)
+        return self._proceses_response(response)
+
+    def _construct_request_kwargs(self, body: Any) -> dict:
+        """Constructs the keyword arguments for ``requests.post``.
+
+        The body is sent as ``json`` when it is JSON serializable and as
+        ``data`` otherwise.
+        """
+        from ads.model.common.utils import _is_json_serializable
+
+        # Work on a copy: popping from ``self.endpoint_kwargs`` directly would
+        # drop the user's custom headers from the second request onwards.
+        _endpoint_kwargs = dict(self.endpoint_kwargs or {})
+        headers = _endpoint_kwargs.pop("headers", DEFAULT_HEADER)
+        return (
+            dict(
+                headers=headers,
+                json=body,
+                auth=self.auth.get("signer"),
+                **_endpoint_kwargs,
+            )
+            if _is_json_serializable(body)
+            else dict(
+                headers=headers,
+                data=body,
+                auth=self.auth.get("signer"),
+                **_endpoint_kwargs,
+            )
+        )
+
+    def _construct_request_body(self, texts: List[str], params: dict) -> Any:
+        """Constructs the request body; ``params`` is currently unused."""
+        return {"input": texts}
+
+    def _proceses_response(self, response: requests.Response) -> List[List[float]]:
+        """Extracts the embeddings from a ``requests.Response``.
+
+        Args:
+            response: The HTTP response returned by the endpoint.
+
+        Returns:
+            One embedding (list of floats) per input text.
+
+        Raises:
+            ValueError: If the response is not JSON or lacks the expected keys.
+        """
+        try:
+            data = response.json()["data"]
+            first = data[0]["embedding"]
+            # NOTE(review): the server schema is not visible here. When each
+            # ``data`` item carries one flat vector, collect all of them so the
+            # result matches the declared return type; a batch already nested
+            # under the first item is returned as before.
+            if first and isinstance(first[0], (int, float)):
+                embeddings = [item["embedding"] for item in data]
+            else:
+                embeddings = first
+        except Exception as e:
+            raise ValueError(
+                f"Error raised by inference API: {e}.\nResponse: {response.text}"
+            ) from e
+        return embeddings
+
+    def embed_documents(
+        self,
+        texts: List[str],
+        chunk_size: Optional[int] = None,
+    ) -> List[List[float]]:
+        """Compute doc embeddings using OCI Data Science Model Deployment Endpoint.
+
+        Args:
+            texts: The list of texts to embed.
+            chunk_size: The chunk size defines how many input texts will
+                be grouped together as request. If None, non-positive, or
+                larger than ``len(texts)``, all texts are sent in one request.
+
+        Returns:
+            List of embeddings, one for each text.
+        """
+        # Nothing to embed; also avoids ``range()`` with a zero step below.
+        if not texts:
+            return []
+        if not chunk_size or chunk_size < 0 or chunk_size > len(texts):
+            _chunk_size = len(texts)
+        else:
+            _chunk_size = chunk_size
+        results: List[List[float]] = []
+        for i in range(0, len(texts), _chunk_size):
+            results.extend(self._embedding(texts[i : i + _chunk_size]))
+        return results
+
+    def embed_query(self, text: str) -> List[float]:
+        """Compute query embeddings using OCI Data Science Model Deployment Endpoint.
+
+        Args:
+            text: The text to embed.
+
+        Returns:
+            Embeddings for the text.
+        """
+        return self._embedding([text])[0]
@@ -1,9 +1,11 @@
-# Copyright (c) 2023 Oracle and/or its affiliates.
+# Copyright (c) 2025 Oracle and/or its affiliates.
 # Licensed under the Universal Permissive License v 1.0 as shown at https://oss.oracle.com/licenses/upl/
 
 from langchain_oci.llms.oci_data_science_model_deployment_endpoint import (
     BaseOCIModelDeployment,
     OCIModelDeploymentLLM,
+    OCIModelDeploymentTGI,
+    OCIModelDeploymentVLLM,
 )
 from langchain_oci.llms.oci_generative_ai import OCIGenAI, OCIGenAIBase
 
@@ -12,4 +14,6 @@
     "OCIGenAI",
     "BaseOCIModelDeployment",
     "OCIModelDeploymentLLM",
+    "OCIModelDeploymentTGI",
+    "OCIModelDeploymentVLLM",
 ]