Generate text-to-speech audio using Agno agents integrated with DesiVocal, a service that specializes in high-quality, multilingual text-to-speech (TTS) and voice cloning, with a particular emphasis on Indian and Western languages.
from agno.agent import Agent
from agno.models.openai import OpenAIChat
from agno.tools.desi_vocal import DesiVocalTools

# ---------------------------------------------------------------------------
# Create Agent
# ---------------------------------------------------------------------------

# Instruction lines handed to the agent as-is. They are kept in a named list
# so the constructor call below stays compact and the wording is easy to audit.
_AUDIO_INSTRUCTIONS = [
    "When the user asks you to generate audio, use the `text_to_speech` tool to generate the audio.",
    "You'll generate the appropriate prompt to send to the tool to generate audio.",
    "You don't need to find the appropriate voice first, I already specified the voice to user.",
    "Return the audio file name in your response. Don't convert it to markdown.",
    "Generate the text prompt we send in hindi language",
]

# Agent backed by the "gpt-4o" OpenAI chat model with the DesiVocal toolkit
# registered as its only tool.
audio_agent = Agent(
    model=OpenAIChat(id="gpt-4o"),
    tools=[DesiVocalTools()],
    description="You are an AI agent that can generate audio using the DesiVocal API.",
    instructions=_AUDIO_INSTRUCTIONS,
    markdown=True,
)

# ---------------------------------------------------------------------------
# Run Agent
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    # Sample request used when the file is executed directly as a script.
    prompt = "Generate a very small audio of history of french revolution"
    audio_agent.print_response(prompt)