# langchain/libs/community/langchain_community/tools/google_cloud/texttospeech.py

from __future__ import annotations

import tempfile
from typing import TYPE_CHECKING, Any, Optional

from langchain_core.callbacks import CallbackManagerForToolRun
from langchain_core.tools import BaseTool

from langchain_community.utilities.vertexai import get_client_info

if TYPE_CHECKING:
    from google.cloud import texttospeech


def _import_google_cloud_texttospeech() -> Any:
    try:
        from google.cloud import texttospeech
    except ImportError as e:
        raise ImportError(
            "Cannot import google.cloud.texttospeech, please install "
            "`pip install google-cloud-texttospeech`."
        ) from e
    return texttospeech


def _encoding_file_extension_map(encoding: texttospeech.AudioEncoding) -> Optional[str]:
    """Look up the file extension used for a given audio encoding.

    Args:
        encoding: A ``texttospeech.AudioEncoding`` member.

    Returns:
        ".wav" for LINEAR16, MULAW and ALAW, ".mp3" for MP3, ".ogg" for
        OGG_OPUS, and None for any encoding not listed here.
    """
    encodings = _import_google_cloud_texttospeech().AudioEncoding

    # Start with the encodings that share the ".wav" extension, then add the rest.
    extension_by_encoding = dict.fromkeys(
        (encodings.LINEAR16, encodings.MULAW, encodings.ALAW), ".wav"
    )
    extension_by_encoding[encodings.MP3] = ".mp3"
    extension_by_encoding[encodings.OGG_OPUS] = ".ogg"

    return extension_by_encoding.get(encoding)


class GoogleCloudTextToSpeechTool(BaseTool):
    """Tool that synthesizes speech through the Google Cloud Text to Speech API.

    Setup instructions for the API are available at:
    https://cloud.google.com/text-to-speech/docs/before-you-begin
    """

    name: str = "google_cloud_texttospeech"
    description: str = (
        "A wrapper around Google Cloud Text-to-Speech. "
        "Useful for when you need to synthesize audio from text. "
        "It supports multiple languages, including English, German, Polish, "
        "Spanish, Italian, French, Portuguese, and Hindi. "
    )

    # Text-to-Speech API client; assigned in __init__.
    _client: Any

    def __init__(self, **kwargs: Any) -> None:
        """Build the tool and create its Text-to-Speech client.

        The import helper runs before the base-class initializer, so a missing
        ``google-cloud-texttospeech`` package is reported as ImportError first.

        Args:
            **kwargs: Forwarded unchanged to the base-class initializer.
        """
        tts = _import_google_cloud_texttospeech()

        super().__init__(**kwargs)

        make_client = tts.TextToSpeechClient
        self._client = make_client(
            client_info=get_client_info(module="text-to-speech")
        )

    def _run(
        self,
        input_text: str,
        language_code: str = "en-US",
        ssml_gender: Optional[texttospeech.SsmlVoiceGender] = None,
        audio_encoding: Optional[texttospeech.AudioEncoding] = None,
        run_manager: Optional[CallbackManagerForToolRun] = None,
    ) -> str:
        """Synthesize ``input_text`` and return the path of the audio file.

        Args:
            input_text: Text handed to the API as the synthesis input.
            language_code: Language code used for voice selection.
            ssml_gender: Voice gender; a falsy value selects NEUTRAL.
            audio_encoding: Output encoding; a falsy value selects MP3.
            run_manager: Part of the signature; not used in this method.

        Returns:
            Name of the temporary file the audio content was written to. The
            file is created with ``delete=False``, so it is not removed when
            it is closed.
        """
        tts = _import_google_cloud_texttospeech()
        if not ssml_gender:
            ssml_gender = tts.SsmlVoiceGender.NEUTRAL
        if not audio_encoding:
            audio_encoding = tts.AudioEncoding.MP3

        synthesize = self._client.synthesize_speech
        synthesis_input = tts.SynthesisInput(text=input_text)
        voice_params = tts.VoiceSelectionParams(
            language_code=language_code, ssml_gender=ssml_gender
        )
        audio_config = tts.AudioConfig(audio_encoding=audio_encoding)
        response = synthesize(
            input=synthesis_input,
            voice=voice_params,
            audio_config=audio_config,
        )

        # The suffix is None for encodings without a known extension.
        audio_file = tempfile.NamedTemporaryFile(
            mode="bx",
            suffix=_encoding_file_extension_map(audio_encoding),
            delete=False,
        )
        with audio_file:
            audio_file.write(response.audio_content)
        return audio_file.name
community[major], core[patch], langchain[patch], experimental[patch]: Create langchain-community (#14463) Moved the following modules to new package langchain-community in a backwards compatible fashion: ``` mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv 
langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community ``` Moved the following to core ``` mv langchain/langchain/utils/json_schema.py core/langchain_core/utils mv langchain/langchain/utils/html.py core/langchain_core/utils mv langchain/langchain/utils/strings.py core/langchain_core/utils cat langchain/langchain/utils/env.py >> core/langchain_core/utils/env.py rm langchain/langchain/utils/env.py ``` See .scripts/community_split/script_integrations.sh for all changes 2023-12-11 21:53:30 +00:00			`from __future__ import annotations`

			`import tempfile`
			`from typing import TYPE_CHECKING, Any, Optional`

			`from langchain_core.callbacks import CallbackManagerForToolRun`
			`from langchain_core.tools import BaseTool`

			`from langchain_community.utilities.vertexai import get_client_info`

			`if TYPE_CHECKING:`
			`from google.cloud import texttospeech`


			`def _import_google_cloud_texttospeech() -> Any:`
			`try:`
			`from google.cloud import texttospeech`
			`except ImportError as e:`
			`raise ImportError(`
			`"Cannot import google.cloud.texttospeech, please install "`
			"`pip install google-cloud-texttospeech`."
			`) from e`
			`return texttospeech`


			`def _encoding_file_extension_map(encoding: texttospeech.AudioEncoding) -> Optional[str]:`
			`texttospeech = _import_google_cloud_texttospeech()`

			`ENCODING_FILE_EXTENSION_MAP = {`
			`texttospeech.AudioEncoding.LINEAR16: ".wav",`
			`texttospeech.AudioEncoding.MP3: ".mp3",`
			`texttospeech.AudioEncoding.OGG_OPUS: ".ogg",`
			`texttospeech.AudioEncoding.MULAW: ".wav",`
			`texttospeech.AudioEncoding.ALAW: ".wav",`
			`}`
			`return ENCODING_FILE_EXTENSION_MAP.get(encoding)`


			`class GoogleCloudTextToSpeechTool(BaseTool):`
			`"""Tool that queries the Google Cloud Text to Speech API.`

			`In order to set this up, follow instructions at:`
			`https://cloud.google.com/text-to-speech/docs/before-you-begin`
			`"""`

			`name: str = "google_cloud_texttospeech"`
			`description: str = (`
			`"A wrapper around Google Cloud Text-to-Speech. "`
			`"Useful for when you need to synthesize audio from text. "`
			`"It supports multiple languages, including English, German, Polish, "`
			`"Spanish, Italian, French, Portuguese, and Hindi. "`
			`)`

			`_client: Any`

			`def __init__(self, **kwargs: Any) -> None:`
			`"""Initializes private fields."""`
			`texttospeech = _import_google_cloud_texttospeech()`

			`super().__init__(**kwargs)`

			`self._client = texttospeech.TextToSpeechClient(`
			`client_info=get_client_info(module="text-to-speech")`
			`)`

			`def _run(`
			`self,`
			`input_text: str,`
			`language_code: str = "en-US",`
			`ssml_gender: Optional[texttospeech.SsmlVoiceGender] = None,`
			`audio_encoding: Optional[texttospeech.AudioEncoding] = None,`
			`run_manager: Optional[CallbackManagerForToolRun] = None,`
			`) -> str:`
			`"""Use the tool."""`
			`texttospeech = _import_google_cloud_texttospeech()`
			`ssml_gender = ssml_gender or texttospeech.SsmlVoiceGender.NEUTRAL`
			`audio_encoding = audio_encoding or texttospeech.AudioEncoding.MP3`

			`response = self._client.synthesize_speech(`
			`input=texttospeech.SynthesisInput(text=input_text),`
			`voice=texttospeech.VoiceSelectionParams(`
			`language_code=language_code, ssml_gender=ssml_gender`
			`),`
			`audio_config=texttospeech.AudioConfig(audio_encoding=audio_encoding),`
			`)`

			`suffix = _encoding_file_extension_map(audio_encoding)`

			`with tempfile.NamedTemporaryFile(mode="bx", suffix=suffix, delete=False) as f:`
			`f.write(response.audio_content)`
			`return f.name`