Text-to-Speech and Speech-to-Text
# Basic text-to-speech example using the "openai/tts-1" model.
from praisonaiagents import AudioAgent

agent = AudioAgent(llm="openai/tts-1")
# `output` names the target file; presumably the synthesized audio is
# written there -- confirm against the AudioAgent documentation.
agent.say("Hello!", output="hello.mp3")
# Text-to-speech example with an explicit voice and speed, using the
# "openai/tts-1-hd" model.
from praisonaiagents import AudioAgent

agent = AudioAgent(llm="openai/tts-1-hd")
# Voices: alloy, echo, fable, onyx, nova, shimmer
agent.speech("Hello!", voice="nova", speed=1.2, output="hello.mp3")
# Speech-to-text example using the "openai/whisper-1" model.
from praisonaiagents import AudioAgent

agent = AudioAgent(llm="openai/whisper-1")
# The value returned by listen() is printed as-is; presumably it is the
# transcribed text -- confirm against the AudioAgent documentation.
text = agent.listen("audio.mp3")
print(text)
# Speech-to-text example using the "groq/whisper-large-v3" model with an
# explicit language hint.
from praisonaiagents import AudioAgent

agent = AudioAgent(llm="groq/whisper-large-v3")  # 10x faster
# Kept on its own line: when fused after the inline comment above, this call
# and the print below were swallowed by the comment and never executed.
text = agent.transcribe("audio.mp3", language="en")
print(text)