File size: 418 Bytes
73d4f3c
9aa985d
c7fc3b6
73d4f3c
 
9aa985d
544d113
14f424f
9aa985d
73d4f3c
 
544d113
73d4f3c
9aa985d
91b1985
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
from services.gemini_client import get_gemini_client
from google.genai import types

async def speech_to_text(audio_bytes: bytes, *, mime_type: str = "audio/wav") -> str:
    """Transcribe spoken audio to text using the Gemini API.

    The audio is sent inline with the request (no Files API upload), together
    with a short instruction asking the model for a transcript.

    Args:
        audio_bytes: Raw bytes of the encoded audio clip.
        mime_type: MIME type describing ``audio_bytes``. Defaults to
            ``"audio/wav"``, which is what this function always sent before
            the parameter existed.

    Returns:
        The text produced by the model, or an empty string when the response
        carries no text.

    Raises:
        ValueError: If ``audio_bytes`` is empty.

    NOTE(review): assumes ``get_gemini_client()`` returns a
    ``google.genai.Client`` (so that ``client.aio`` is available) -- confirm
    against ``services.gemini_client``.
    """
    if not audio_bytes:
        # Fail fast instead of spending a network round-trip on empty audio.
        raise ValueError("audio_bytes must not be empty")

    client = get_gemini_client()

    # Inline media must be wrapped in a Part. ``types.File`` is the metadata
    # record for a file uploaded through the Files API and has no ``data``
    # field, so it cannot carry raw bytes.
    audio_part = types.Part.from_bytes(data=audio_bytes, mime_type=mime_type)

    # Use the SDK's async surface so the event loop is not blocked while the
    # request is in flight.
    response = await client.aio.models.generate_content(
        model="gemini-2.5-flash",
        contents=[
            # Without an instruction the model is free to respond to the
            # audio in any way; ask explicitly for a transcript.
            "Generate a verbatim transcript of the speech in this audio.",
            audio_part,
        ],
    )

    # ``response.text`` may be None (e.g. no text parts in the response);
    # normalise so the declared ``str`` return type always holds.
    return response.text or ""