Text-to-Speech
- Basic
- Advanced
Speech-to-Text
- Basic
- Advanced
Text-to-Speech and Speech-to-Text
# Text-to-Speech (basic): build an AudioAgent on the "openai/tts-1" model and
# ask it to say a short phrase, passing "hello.mp3" as the output target.
# NOTE(review): presumably the synthesized audio is written to that file --
# confirm against the AudioAgent API.
from praisonaiagents import AudioAgent

phrase = "Hello!"
audio_path = "hello.mp3"

tts_agent = AudioAgent(llm="openai/tts-1")
tts_agent.say(phrase, output=audio_path)
# Text-to-Speech (advanced): same idea as the basic call, but using the
# "openai/tts-1-hd" model and passing explicit voice and speed options to
# speech().
from praisonaiagents import AudioAgent

hd_tts_agent = AudioAgent(llm="openai/tts-1-hd")

# Voices: alloy, echo, fable, onyx, nova, shimmer
# NOTE(review): speed=1.2 is presumably a rate multiplier (1.0 = normal) --
# confirm against the provider documentation.
hd_tts_agent.speech(
    "Hello!",
    voice="nova",
    speed=1.2,
    output="hello.mp3",
)
# Speech-to-Text (basic): build an AudioAgent on the "openai/whisper-1" model,
# pass it "audio.mp3" via listen(), and print whatever listen() returns.
# NOTE(review): the return value is presumably the transcribed text -- confirm
# against the AudioAgent API.
from praisonaiagents import AudioAgent

recording_path = "audio.mp3"

stt_agent = AudioAgent(llm="openai/whisper-1")
transcript = stt_agent.listen(recording_path)
print(transcript)
# Speech-to-Text (advanced): use the "groq/whisper-large-v3" model and call
# transcribe() with an explicit language argument, then print the result.
from praisonaiagents import AudioAgent

# The original example describes this model as "10x faster"; the baseline is
# not stated (presumably relative to "openai/whisper-1" -- TODO confirm).
groq_stt_agent = AudioAgent(llm="groq/whisper-large-v3")

# NOTE(review): language="en" is presumably a hint that the audio is English --
# confirm against the AudioAgent API.
transcript = groq_stt_agent.transcribe(
    "audio.mp3",
    language="en",
)
print(transcript)