Flux is the first conversational speech recognition model built specifically for voice agents.
Flux (deepgram/flux) is an audio-stt model from Deepgram, released 2025-09-29. Pricing via AIgateway: $0.0077 per minute. Capabilities: streaming. Call it via https://api.aigateway.sh/v1/audio/transcriptions — set model="deepgram/flux". Best for: Meeting transcripts, Captions, Voice agents.
curl https://api.aigateway.sh/v1/audio/transcriptions \
-H "Authorization: Bearer $AIGATEWAY_API_KEY" \
-F model="deepgram/flux" \
-F file="@audio.mp3"
// Realtime WebSocket. Browsers pass the key as ?api_key=
// Open the realtime transcription socket; the API key is appended as the
// final query parameter of the connection URL.
const ws = new WebSocket(
  `wss://api.aigateway.sh/v1/realtime?model=deepgram/flux&encoding=linear16&sample_rate=16000&interim_results=true&api_key=${AIGATEWAY_API_KEY}`,
);

// Each incoming frame is parsed as JSON. Only "Results" messages are handled:
// the first alternative's transcript is logged next to the is_final flag.
ws.onmessage = (event) => {
  const payload = JSON.parse(event.data);
  if (payload.type !== "Results") {
    return;
  }
  const firstAlternative = payload.channel.alternatives[0];
  console.log(firstAlternative.transcript, payload.is_final);
};
// stream raw audio frames (linear16 PCM @ 16 kHz):
// ws.send(pcmChunk)
// ...then end the stream:
ws.send(JSON.stringify({ type: "CloseStream" }));
# multipart/form-data — use curl -F or SDK file upload
model="deepgram/flux"
file=@audio.mp3
response_format=json # or "verbose_json", "text", "srt", "vtt"
language=en # optional
{
"text": "Hello from AIgateway.",
"language": "en",
"duration": 1.82
}
from openai import OpenAI
# Point the OpenAI SDK client at the AIgateway base URL; "sk-aig-..." is a
# placeholder for a real key.
client = OpenAI(base_url="https://api.aigateway.sh/v1", api_key="sk-aig-...")

# Upload the audio file in binary mode and request a transcription.
# The call sits inside the `with` block so the file handle is still open
# while the SDK reads it, and is closed afterwards.
with open("audio.mp3", "rb") as f:
    r = client.audio.transcriptions.create(model="deepgram/flux", file=f)

# Print the transcript text from the response.
print(r.text)