Documentation Index
Fetch the complete documentation index at: https://agno-v2-shaloo-ai-support-link.mintlify.app/llms.txt
Use this file to discover all available pages before exploring further.
Agno supports audio as input to agents and teams. Take a look at the compatibility matrix to see which models support audio as input.
Let’s create an agent that can understand audio input.
import base64
import requests
from agno.agent import Agent, RunOutput # noqa
from agno.media import Audio
from agno.models.openai import OpenAIResponses
# Download the sample WAV file and keep its raw bytes. The bytes are handed to
# Audio(content=...) as-is; this script performs no base64 encoding.
url = "https://openaiassets.blob.core.windows.net/$web/API/docs/audio/alloy.wav"
# A timeout keeps the example from hanging forever if the host never responds.
response = requests.get(url, timeout=30)
# Fail fast on an HTTP error instead of forwarding an error page as "audio".
response.raise_for_status()
wav_data = response.content

# NOTE(review): confirm this model id accepts audio input (check the
# compatibility matrix mentioned above) -- it cannot be verified from here.
agent = Agent(
    model=OpenAIResponses(id="gpt-5.2-audio-preview", modalities=["text"]),
    markdown=True,
)

# Ask a question about the clip; the audio is attached as a single WAV item.
agent.print_response(
    "What is in this audio?",
    audio=[Audio(content=wav_data, format="wav")],
)