File size: 471 Bytes
73d4f3c
9aa985d
c7fc3b6
73d4f3c
 
9aa985d
14f424f
 
9aa985d
73d4f3c
 
14f424f
73d4f3c
9aa985d
91b1985
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
from services.gemini_client import get_gemini_client
from google.genai import types

async def speech_to_text(audio_bytes: bytes) -> str:
    """Transcribe WAV audio to text with the Gemini API.

    Args:
        audio_bytes: Raw audio content. It is sent with the MIME type
            ``audio/wav``, so callers are expected to pass WAV data.

    Returns:
        The text of the model's response, or an empty string when
        ``audio_bytes`` is empty or the response carries no text.

    Note:
        Assumes ``get_gemini_client()`` returns a ``google.genai.Client``
        (it is defined outside this module -- confirm). The audio is sent
        inline with the request; very large recordings may need the Files
        API instead.
    """
    # Nothing to transcribe: skip the network round trip entirely.
    if not audio_bytes:
        return ""

    client = get_gemini_client()

    # Inline binary payloads are carried by a Part. types.File only describes
    # a file that was already uploaded through the Files API and has no
    # ``data`` field, so it cannot wrap raw bytes.
    audio_part = types.Part.from_bytes(data=audio_bytes, mime_type="audio/wav")

    # Use the SDK's async surface so the event loop is not blocked while the
    # request is in flight. The text instruction tells the model to transcribe
    # rather than respond to whatever is said in the recording.
    response = await client.aio.models.generate_content(
        model="gemini-2.5-flash",
        contents=[
            "Generate a verbatim transcript of the speech in this audio. "
            "Return only the transcript text.",
            audio_part,
        ],
    )

    # response.text is None when the response contains no text parts; keep
    # the declared ``str`` return type.
    return response.text or ""