|
import os

import gradio as gr
from elevenlabs import set_api_key
from langchain.agents import AgentType, initialize_agent, load_tools
from langchain.llms import Together
from langchain.tools import ElevenLabsText2SpeechTool
|
|
|
|
|
def _require_env(name):
    """Return the value of environment variable *name*.

    Raises:
        RuntimeError: if the variable is unset or empty, so a missing
            credential fails loudly at startup rather than on first API call.
    """
    value = os.environ.get(name)
    if not value:
        raise RuntimeError(
            f"Environment variable {name} must be set before starting the app."
        )
    return value


# SECURITY: API keys were previously committed in this file. Secrets must not
# live in source control; they are read from the environment instead.
# NOTE(review): the previously committed keys should be treated as leaked and
# rotated with the respective providers.
# NOTE(review): the variable names below are the ones the LangChain
# integrations are presumed to look up themselves -- confirm against the
# installed versions.
set_api_key(_require_env("ELEVEN_API_KEY"))

# Standalone text-to-speech tool instance.
tts = ElevenLabsText2SpeechTool()

# Together-hosted Mixtral instruct model; top_k=1 with a short 128-token
# completion budget.
llm = Together(
    model="mistralai/Mixtral-8x7B-Instruct-v0.1",
    temperature=0.7,
    max_tokens=128,
    top_k=1,
    together_api_key=_require_env("TOGETHER_API_KEY"),
)

# Tool list handed to the agent (the ElevenLabs text-to-speech tool by name).
tools = load_tools(["eleven_labs_text2speech"])

# Structured-chat ReAct agent wired to the LLM and tools above; verbose=True
# is passed through to the agent executor.
agent = initialize_agent(
    tools=tools,
    llm=llm,
    agent=AgentType.STRUCTURED_CHAT_ZERO_SHOT_REACT_DESCRIPTION,
    verbose=True,
)
|
|
|
|
|
def generate_speech(text_to_speak): |
|
speech_file |
|
|