langchain/libs/community/langchain_community/llms/oci_generative_ai.py

from __future__ import annotations

from abc import ABC
from enum import Enum
from typing import Any, Dict, List, Mapping, Optional

from langchain_core.callbacks import CallbackManagerForLLMRun
from langchain_core.language_models.llms import LLM
from langchain_core.pydantic_v1 import BaseModel, Extra, root_validator

from langchain_community.llms.utils import enforce_stop_tokens

CUSTOM_ENDPOINT_PREFIX = "ocid1.generativeaiendpoint"
VALID_PROVIDERS = ("cohere", "meta")


class OCIAuthType(Enum):
    API_KEY = 1
    SECURITY_TOKEN = 2
    INSTANCE_PRINCIPAL = 3
    RESOURCE_PRINCIPAL = 4


class OCIGenAIBase(BaseModel, ABC):
    """Base class for OCI GenAI models"""

    client: Any  #: :meta private:

    auth_type: Optional[str] = "API_KEY"
    """Authentication type, could be 
    
    API_KEY, 
    SECURITY_TOKEN, 
    INSTANCE_PRINCIPLE, 
    RESOURCE_PRINCIPLE

    If not specified, API_KEY will be used
    """

    auth_profile: Optional[str] = "DEFAULT"
    """The name of the profile in ~/.oci/config
    If not specified , DEFAULT will be used 
    """

    model_id: str = None
    """Id of the model to call, e.g., cohere.command"""

    provider: str = None
    """Provider name of the model. Default to None, 
    will try to be derived from the model_id
    otherwise, requires user input
    """

    model_kwargs: Optional[Dict] = None
    """Keyword arguments to pass to the model"""

    service_endpoint: str = None
    """service endpoint url"""

    compartment_id: str = None
    """OCID of compartment"""

    is_stream: bool = False
    """Whether to stream back partial progress"""

    llm_stop_sequence_mapping: Mapping[str, str] = {
        "cohere": "stop_sequences",
        "meta": "stop",
    }

    @root_validator()
    def validate_environment(cls, values: Dict) -> Dict:
        """Validate that OCI config and python package exists in environment."""

        # Skip creating new client if passed in constructor
        if values["client"] is not None:
            return values

        try:
            import oci

            client_kwargs = {
                "config": {},
                "signer": None,
                "service_endpoint": values["service_endpoint"],
                "retry_strategy": oci.retry.DEFAULT_RETRY_STRATEGY,
                "timeout": (10, 240),  # default timeout config for OCI Gen AI service
            }

            if values["auth_type"] == OCIAuthType(1).name:
                client_kwargs["config"] = oci.config.from_file(
                    profile_name=values["auth_profile"]
                )
                client_kwargs.pop("signer", None)
            elif values["auth_type"] == OCIAuthType(2).name:

                def make_security_token_signer(oci_config):
                    pk = oci.signer.load_private_key_from_file(
                        oci_config.get("key_file"), None
                    )
                    with open(
                        oci_config.get("security_token_file"), encoding="utf-8"
                    ) as f:
                        st_string = f.read()
                    return oci.auth.signers.SecurityTokenSigner(st_string, pk)

                client_kwargs["config"] = oci.config.from_file(
                    profile_name=values["auth_profile"]
                )
                client_kwargs["signer"] = make_security_token_signer(
                    oci_config=client_kwargs["config"]
                )
            elif values["auth_type"] == OCIAuthType(3).name:
                client_kwargs[
                    "signer"
                ] = oci.auth.signers.InstancePrincipalsSecurityTokenSigner()
            elif values["auth_type"] == OCIAuthType(4).name:
                client_kwargs[
                    "signer"
                ] = oci.auth.signers.get_resource_principals_signer()
            else:
                raise ValueError("Please provide valid value to auth_type")

            values["client"] = oci.generative_ai_inference.GenerativeAiInferenceClient(
                **client_kwargs
            )

        except ImportError as ex:
            raise ModuleNotFoundError(
                "Could not import oci python package. "
                "Please make sure you have the oci package installed."
            ) from ex
        except Exception as e:
            raise ValueError(
                "Could not authenticate with OCI client. "
                "Please check if ~/.oci/config exists. "
                "If INSTANCE_PRINCIPLE or RESOURCE_PRINCIPLE is used, "
                "Please check the specified "
                "auth_profile and auth_type are valid."
            ) from e

        return values

    @property
    def _identifying_params(self) -> Mapping[str, Any]:
        """Get the identifying parameters."""
        _model_kwargs = self.model_kwargs or {}
        return {
            **{"model_kwargs": _model_kwargs},
        }

    def _get_provider(self) -> str:
        if self.provider is not None:
            provider = self.provider
        else:
            provider = self.model_id.split(".")[0].lower()

        if provider not in VALID_PROVIDERS:
            raise ValueError(
                f"Invalid provider derived from model_id: {self.model_id} "
                "Please explicitly pass in the supported provider "
                "when using custom endpoint"
            )
        return provider


class OCIGenAI(LLM, OCIGenAIBase):
    """OCI large language models.

    To authenticate, the OCI client uses the methods described in
    https://docs.oracle.com/en-us/iaas/Content/API/Concepts/sdk_authentication_methods.htm

    The authentifcation method is passed through auth_type and should be one of:
    API_KEY (default), SECURITY_TOKEN, INSTANCE_PRINCIPLE, RESOURCE_PRINCIPLE

    Make sure you have the required policies (profile/roles) to
    access the OCI Generative AI service.
    If a specific config profile is used, you must pass
    the name of the profile (from ~/.oci/config) through auth_profile.

    To use, you must provide the compartment id
    along with the endpoint url, and model id
    as named parameters to the constructor.

    Example:
        .. code-block:: python

            from langchain_community.llms import OCIGenAI

            llm = OCIGenAI(
                    model_id="MY_MODEL_ID",
                    service_endpoint="https://inference.generativeai.us-chicago-1.oci.oraclecloud.com",
                    compartment_id="MY_OCID"
                )
    """

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid

    @property
    def _llm_type(self) -> str:
        """Return type of llm."""
        return "oci"

    def _prepare_invocation_object(
        self, prompt: str, stop: Optional[List[str]], kwargs: Dict[str, Any]
    ) -> Dict[str, Any]:
        from oci.generative_ai_inference import models

        oci_llm_request_mapping = {
            "cohere": models.CohereLlmInferenceRequest,
            "meta": models.LlamaLlmInferenceRequest,
        }
        provider = self._get_provider()
        _model_kwargs = self.model_kwargs or {}
        if stop is not None:
            _model_kwargs[self.llm_stop_sequence_mapping[provider]] = stop

        if self.model_id.startswith(CUSTOM_ENDPOINT_PREFIX):
            serving_mode = models.DedicatedServingMode(endpoint_id=self.model_id)
        else:
            serving_mode = models.OnDemandServingMode(model_id=self.model_id)

        inference_params = {**_model_kwargs, **kwargs}
        inference_params["prompt"] = prompt
        inference_params["is_stream"] = self.is_stream

        invocation_obj = models.GenerateTextDetails(
            compartment_id=self.compartment_id,
            serving_mode=serving_mode,
            inference_request=oci_llm_request_mapping[provider](**inference_params),
        )

        return invocation_obj

    def _process_response(self, response: Any, stop: Optional[List[str]]) -> str:
        provider = self._get_provider()
        if provider == "cohere":
            text = response.data.inference_response.generated_texts[0].text
        elif provider == "meta":
            text = response.data.inference_response.choices[0].text
        else:
            raise ValueError(f"Invalid provider: {provider}")

        if stop is not None:
            text = enforce_stop_tokens(text, stop)

        return text

    def _call(
        self,
        prompt: str,
        stop: Optional[List[str]] = None,
        run_manager: Optional[CallbackManagerForLLMRun] = None,
        **kwargs: Any,
    ) -> str:
        """Call out to OCIGenAI generate endpoint.

        Args:
            prompt: The prompt to pass into the model.
            stop: Optional list of stop words to use when generating.

        Returns:
            The string generated by the model.

        Example:
            .. code-block:: python

               response = llm.invoke("Tell me a joke.")
        """

        invocation_obj = self._prepare_invocation_object(prompt, stop, kwargs)
        response = self.client.generate_text(invocation_obj)
        return self._process_response(response, stop)
community[minor]: Add OCI Generative AI integration (#16548) <!-- Thank you for contributing to LangChain! Please title your PR "<package>: <description>", where <package> is whichever of langchain, community, core, experimental, etc. is being modified. Replace this entire comment with: - Description: Adding Oracle Cloud Infrastructure Generative AI integration. Oracle Cloud Infrastructure (OCI) Generative AI is a fully managed service that provides a set of state-of-the-art, customizable large language models (LLMs) that cover a wide range of use cases, and which is available through a single API. Using the OCI Generative AI service you can access ready-to-use pretrained models, or create and host your own fine-tuned custom models based on your own data on dedicated AI clusters. https://docs.oracle.com/en-us/iaas/Content/generative-ai/home.htm - Issue: None, - Dependencies: OCI Python SDK, - Twitter handle: we announce bigger features on Twitter. If your PR gets announced, and you'd like a mention, we'll gladly shout you out! Please make sure your PR is passing linting and testing before submitting. Run `make format`, `make lint` and `make test` from the root of the package you've modified to check this locally. Passed See contribution guidelines for more information on how to write/run tests, lint, etc: https://python.langchain.com/docs/contributing/ If you're adding a new integration, please include: 1. a test for the integration, preferably unit tests that do not rely on network access, 2. an example notebook showing its use. It lives in `docs/docs/integrations` directory. we provide unit tests. However, we cannot provide integration tests due to Oracle policies that prohibit public sharing of api keys. If no one reviews your PR within a few days, please @-mention one of @baskaryan, @eyurtsev, @hwchase17. --> --------- Co-authored-by: Arthur Cheng <arthur.cheng@oracle.com> Co-authored-by: Bagatur <baskaryan@gmail.com> 8 months ago			`from __future__ import annotations`

			`from abc import ABC`
			`from enum import Enum`
			`from typing import Any, Dict, List, Mapping, Optional`

			`from langchain_core.callbacks import CallbackManagerForLLMRun`
			`from langchain_core.language_models.llms import LLM`
			`from langchain_core.pydantic_v1 import BaseModel, Extra, root_validator`

			`from langchain_community.llms.utils import enforce_stop_tokens`

			`CUSTOM_ENDPOINT_PREFIX = "ocid1.generativeaiendpoint"`
			`VALID_PROVIDERS = ("cohere", "meta")`


			`class OCIAuthType(Enum):`
			`API_KEY = 1`
			`SECURITY_TOKEN = 2`
			`INSTANCE_PRINCIPAL = 3`
			`RESOURCE_PRINCIPAL = 4`


			`class OCIGenAIBase(BaseModel, ABC):`
			`"""Base class for OCI GenAI models"""`

			`client: Any #: :meta private:`

			`auth_type: Optional[str] = "API_KEY"`
			`"""Authentication type, could be`

			`API_KEY,`
			`SECURITY_TOKEN,`
			`INSTANCE_PRINCIPLE,`
			`RESOURCE_PRINCIPLE`

			`If not specified, API_KEY will be used`
			`"""`

			`auth_profile: Optional[str] = "DEFAULT"`
			`"""The name of the profile in ~/.oci/config`
			`If not specified , DEFAULT will be used`
			`"""`

			`model_id: str = None`
			`"""Id of the model to call, e.g., cohere.command"""`

			`provider: str = None`
			`"""Provider name of the model. Default to None,`
			`will try to be derived from the model_id`
			`otherwise, requires user input`
			`"""`

			`model_kwargs: Optional[Dict] = None`
			`"""Keyword arguments to pass to the model"""`

			`service_endpoint: str = None`
			`"""service endpoint url"""`

			`compartment_id: str = None`
			`"""OCID of compartment"""`

			`is_stream: bool = False`
			`"""Whether to stream back partial progress"""`

			`llm_stop_sequence_mapping: Mapping[str, str] = {`
			`"cohere": "stop_sequences",`
			`"meta": "stop",`
			`}`

			`@root_validator()`
			`def validate_environment(cls, values: Dict) -> Dict:`
			`"""Validate that OCI config and python package exists in environment."""`

			`# Skip creating new client if passed in constructor`
			`if values["client"] is not None:`
			`return values`

			`try:`
			`import oci`

			`client_kwargs = {`
			`"config": {},`
			`"signer": None,`
			`"service_endpoint": values["service_endpoint"],`
			`"retry_strategy": oci.retry.DEFAULT_RETRY_STRATEGY,`
			`"timeout": (10, 240), # default timeout config for OCI Gen AI service`
			`}`

			`if values["auth_type"] == OCIAuthType(1).name:`
			`client_kwargs["config"] = oci.config.from_file(`
			`profile_name=values["auth_profile"]`
			`)`
			`client_kwargs.pop("signer", None)`
			`elif values["auth_type"] == OCIAuthType(2).name:`

			`def make_security_token_signer(oci_config):`
			`pk = oci.signer.load_private_key_from_file(`
			`oci_config.get("key_file"), None`
			`)`
			`with open(`
			`oci_config.get("security_token_file"), encoding="utf-8"`
			`) as f:`
			`st_string = f.read()`
			`return oci.auth.signers.SecurityTokenSigner(st_string, pk)`

			`client_kwargs["config"] = oci.config.from_file(`
			`profile_name=values["auth_profile"]`
			`)`
			`client_kwargs["signer"] = make_security_token_signer(`
			`oci_config=client_kwargs["config"]`
			`)`
			`elif values["auth_type"] == OCIAuthType(3).name:`
			`client_kwargs[`
			`"signer"`
			`] = oci.auth.signers.InstancePrincipalsSecurityTokenSigner()`
			`elif values["auth_type"] == OCIAuthType(4).name:`
			`client_kwargs[`
			`"signer"`
			`] = oci.auth.signers.get_resource_principals_signer()`
			`else:`
			`raise ValueError("Please provide valid value to auth_type")`

			`values["client"] = oci.generative_ai_inference.GenerativeAiInferenceClient(`
			`**client_kwargs`
			`)`

			`except ImportError as ex:`
			`raise ModuleNotFoundError(`
			`"Could not import oci python package. "`
			`"Please make sure you have the oci package installed."`
			`) from ex`
			`except Exception as e:`
			`raise ValueError(`
			`"Could not authenticate with OCI client. "`
			`"Please check if ~/.oci/config exists. "`
			`"If INSTANCE_PRINCIPLE or RESOURCE_PRINCIPLE is used, "`
			`"Please check the specified "`
			`"auth_profile and auth_type are valid."`
			`) from e`

			`return values`

			`@property`
			`def _identifying_params(self) -> Mapping[str, Any]:`
			`"""Get the identifying parameters."""`
			`_model_kwargs = self.model_kwargs or {}`
			`return {`
			`**{"model_kwargs": _model_kwargs},`
			`}`

			`def _get_provider(self) -> str:`
			`if self.provider is not None:`
			`provider = self.provider`
			`else:`
			`provider = self.model_id.split(".")[0].lower()`

			`if provider not in VALID_PROVIDERS:`
			`raise ValueError(`
			`f"Invalid provider derived from model_id: {self.model_id} "`
			`"Please explicitly pass in the supported provider "`
			`"when using custom endpoint"`
			`)`
			`return provider`


			`class OCIGenAI(LLM, OCIGenAIBase):`
			`"""OCI large language models.`

			`To authenticate, the OCI client uses the methods described in`
			`https://docs.oracle.com/en-us/iaas/Content/API/Concepts/sdk_authentication_methods.htm`

			`The authentifcation method is passed through auth_type and should be one of:`
			`API_KEY (default), SECURITY_TOKEN, INSTANCE_PRINCIPLE, RESOURCE_PRINCIPLE`

			`Make sure you have the required policies (profile/roles) to`
			`access the OCI Generative AI service.`
			`If a specific config profile is used, you must pass`
			`the name of the profile (from ~/.oci/config) through auth_profile.`

			`To use, you must provide the compartment id`
			`along with the endpoint url, and model id`
			`as named parameters to the constructor.`

			`Example:`
			`.. code-block:: python`

			`from langchain_community.llms import OCIGenAI`

			`llm = OCIGenAI(`
			`model_id="MY_MODEL_ID",`
			`service_endpoint="https://inference.generativeai.us-chicago-1.oci.oraclecloud.com",`
			`compartment_id="MY_OCID"`
			`)`
			`"""`

			`class Config:`
			`"""Configuration for this pydantic object."""`

			`extra = Extra.forbid`

			`@property`
			`def _llm_type(self) -> str:`
			`"""Return type of llm."""`
			`return "oci"`

			`def _prepare_invocation_object(`
			`self, prompt: str, stop: Optional[List[str]], kwargs: Dict[str, Any]`
			`) -> Dict[str, Any]:`
			`from oci.generative_ai_inference import models`

			`oci_llm_request_mapping = {`
			`"cohere": models.CohereLlmInferenceRequest,`
			`"meta": models.LlamaLlmInferenceRequest,`
			`}`
			`provider = self._get_provider()`
			`_model_kwargs = self.model_kwargs or {}`
			`if stop is not None:`
			`_model_kwargs[self.llm_stop_sequence_mapping[provider]] = stop`

			`if self.model_id.startswith(CUSTOM_ENDPOINT_PREFIX):`
			`serving_mode = models.DedicatedServingMode(endpoint_id=self.model_id)`
			`else:`
			`serving_mode = models.OnDemandServingMode(model_id=self.model_id)`

			`inference_params = {_model_kwargs, kwargs}`
			`inference_params["prompt"] = prompt`
			`inference_params["is_stream"] = self.is_stream`

			`invocation_obj = models.GenerateTextDetails(`
			`compartment_id=self.compartment_id,`
			`serving_mode=serving_mode,`
			`inference_request=oci_llm_request_mapping[provider](**inference_params),`
			`)`

			`return invocation_obj`

			`def _process_response(self, response: Any, stop: Optional[List[str]]) -> str:`
			`provider = self._get_provider()`
			`if provider == "cohere":`
			`text = response.data.inference_response.generated_texts[0].text`
			`elif provider == "meta":`
			`text = response.data.inference_response.choices[0].text`
			`else:`
			`raise ValueError(f"Invalid provider: {provider}")`

			`if stop is not None:`
			`text = enforce_stop_tokens(text, stop)`

			`return text`

			`def _call(`
			`self,`
			`prompt: str,`
			`stop: Optional[List[str]] = None,`
			`run_manager: Optional[CallbackManagerForLLMRun] = None,`
			`**kwargs: Any,`
			`) -> str:`
			`"""Call out to OCIGenAI generate endpoint.`

			`Args:`
			`prompt: The prompt to pass into the model.`
			`stop: Optional list of stop words to use when generating.`

			`Returns:`
			`The string generated by the model.`

			`Example:`
			`.. code-block:: python`

			`response = llm.invoke("Tell me a joke.")`
			`"""`

			`invocation_obj = self._prepare_invocation_object(prompt, stop, kwargs)`
			`response = self.client.generate_text(invocation_obj)`
			`return self._process_response(response, stop)`