mirror of
https://github.com/hwchase17/langchain.git
synced 2025-08-05 19:15:44 +00:00
Co-authored-by: Bagatur <baskaryan@gmail.com> Co-authored-by: Bagatur <22008038+baskaryan@users.noreply.github.com>
82 lines
2.7 KiB
Python
82 lines
2.7 KiB
Python
import tempfile
|
|
from enum import Enum
|
|
from typing import Any, Dict, Optional, Union
|
|
|
|
from langchain_core.callbacks import CallbackManagerForToolRun
|
|
from langchain_core.tools import BaseTool
|
|
from langchain_core.utils import get_from_dict_or_env
|
|
from pydantic import model_validator
|
|
|
|
|
|
def _import_elevenlabs() -> Any:
    """Import the optional ``elevenlabs`` package on demand.

    The import is deferred to call time so this module can be loaded even
    when ``elevenlabs`` is not installed.

    Returns:
        The imported ``elevenlabs`` module.

    Raises:
        ImportError: If ``elevenlabs`` cannot be imported. The original
            import failure is chained as the cause.
    """
    try:
        import elevenlabs as module
    except ImportError as err:
        message = "Cannot import elevenlabs, please install `pip install elevenlabs`."
        raise ImportError(message) from err
    else:
        return module
|
|
|
|
|
|
class ElevenLabsModel(str, Enum):
    """Model identifiers selectable for Eleven Labs Text2Speech.

    Members are also ``str`` instances, so each one compares equal to its
    raw identifier string.
    """

    # Identifier string for the multilingual model.
    MULTI_LINGUAL = "eleven_multilingual_v1"
    # Identifier string for the monolingual model.
    MONO_LINGUAL = "eleven_monolingual_v1"
|
|
|
|
|
|
class ElevenLabsText2SpeechTool(BaseTool):  # type: ignore[override]
    """Tool that queries the Eleven Labs Text2Speech API.

    In order to set this up, follow instructions at:
    https://docs.elevenlabs.io/welcome/introduction

    ``_run`` writes the generated audio to a temporary file and returns its
    path; ``play`` plays such a file back; ``stream_speech`` generates and
    plays audio in one step without writing a file.
    """

    # Model passed to ``elevenlabs.generate``; either an ``ElevenLabsModel``
    # member or a raw model identifier string.
    model: Union[ElevenLabsModel, str] = ElevenLabsModel.MULTI_LINGUAL

    # Tool name and description exposed through the ``BaseTool`` interface.
    name: str = "eleven_labs_text2speech"
    description: str = (
        "A wrapper around Eleven Labs Text2Speech. "
        "Useful for when you need to convert text to speech. "
        "It supports multiple languages, including English, German, Polish, "
        "Spanish, Italian, French, Portuguese, and Hindi. "
    )

    @model_validator(mode="before")
    @classmethod
    def validate_environment(cls, values: Dict) -> Any:
        """Validate that api key exists in environment.

        Looks up ``eleven_api_key`` in ``values`` or the ``ELEVEN_API_KEY``
        environment variable via ``get_from_dict_or_env``.

        Args:
            values: Raw field values supplied to the model before validation.

        Returns:
            ``values``, unmodified.
        """
        # The looked-up key is intentionally discarded: the call is made only
        # for its validation effect.
        # NOTE(review): presumably get_from_dict_or_env raises when the key
        # is missing from both places -- confirm against langchain_core.
        _ = get_from_dict_or_env(values, "eleven_api_key", "ELEVEN_API_KEY")

        return values

    def _run(
        self, query: str, run_manager: Optional[CallbackManagerForToolRun] = None
    ) -> str:
        """Convert ``query`` to speech and save the audio to a temporary file.

        Args:
            query: Text to synthesize.
            run_manager: Optional callback manager; not used by this method.

        Returns:
            Path of the temporary file (``.wav`` suffix) holding the audio.

        Raises:
            ImportError: If the ``elevenlabs`` package is not installed.
            RuntimeError: If generating or writing the audio fails. The
                underlying exception is chained as ``__cause__``.
        """
        # Imported outside the ``try`` so a missing dependency surfaces as
        # ImportError rather than being wrapped in RuntimeError.
        elevenlabs = _import_elevenlabs()
        try:
            speech = elevenlabs.generate(text=query, model=self.model)
            # delete=False keeps the file on disk after the handle is closed,
            # so the returned path stays usable (e.g. by ``play``).
            with tempfile.NamedTemporaryFile(
                mode="bx", suffix=".wav", delete=False
            ) as f:
                f.write(speech)
                return f.name
        except Exception as e:
            # Chain explicitly so the original failure is kept as the cause,
            # matching the ``from e`` style used in ``_import_elevenlabs``.
            raise RuntimeError(
                f"Error while running ElevenLabsText2SpeechTool: {e}"
            ) from e

    def play(self, speech_file: str) -> None:
        """Play the text as speech.

        Args:
            speech_file: Path to an audio file, such as the one returned by
                ``_run``. Its bytes are read and passed to
                ``elevenlabs.play``.

        Raises:
            ImportError: If the ``elevenlabs`` package is not installed.
        """
        elevenlabs = _import_elevenlabs()
        with open(speech_file, mode="rb") as f:
            speech = f.read()

        elevenlabs.play(speech)

    def stream_speech(self, query: str) -> None:
        """Stream the text as speech as it is generated.

        Play the text in your speakers.

        Args:
            query: Text to synthesize.

        Raises:
            ImportError: If the ``elevenlabs`` package is not installed.
        """
        elevenlabs = _import_elevenlabs()
        # stream=True requests a streaming result from generate, which is
        # handed straight to ``elevenlabs.stream``.
        speech_stream = elevenlabs.generate(text=query, model=self.model, stream=True)
        elevenlabs.stream(speech_stream)
|