File size: 471 Bytes
73d4f3c 9aa985d c7fc3b6 73d4f3c 9aa985d 14f424f 9aa985d 73d4f3c 14f424f 73d4f3c 9aa985d 91b1985 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 | from services.gemini_client import get_gemini_client
from google.genai import types
async def speech_to_text(audio_bytes: bytes) -> str:
    """Transcribe WAV audio to text using the Gemini API.

    Args:
        audio_bytes: Raw audio content; it is sent to the model inline with
            the MIME type ``audio/wav``.

    Returns:
        The text of the model response, or ``""`` when *audio_bytes* is
        empty or the response carries no text.
    """
    # Nothing to transcribe: skip the network round-trip entirely.
    if not audio_bytes:
        return ""

    client = get_gemini_client()

    # Inline media must be wrapped in a Part. types.File only describes files
    # uploaded through the Files API and does not accept raw ``data``.
    audio_part = types.Part.from_bytes(data=audio_bytes, mime_type="audio/wav")

    # Use the SDK's async surface (client.aio) so this coroutine does not
    # block the event loop while the request is in flight.
    # NOTE(review): assumes get_gemini_client() returns a google.genai.Client
    # -- confirm against services.gemini_client.
    response = await client.aio.models.generate_content(
        model="gemini-2.5-flash",
        contents=[
            "Transcribe the speech in this audio. Return only the transcript.",
            audio_part,
        ],
    )

    # response.text may be None when the response has no text parts; keep the
    # declared ``str`` return type.
    return response.text or ""
|