ressay1973 committed on
Commit
0f96076
·
verified ·
1 Parent(s): dd7a51a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -4
app.py CHANGED
@@ -2,10 +2,13 @@ from smolagents import CodeAgent, HfApiModel, load_tool, tool
2
  import datetime
3
  import pytz
4
  import yaml
5
- import whisper
6
  from tools.final_answer import FinalAnswerTool
7
  from Gradio_UI import GradioUI
8
 
 
 
 
9
  # Tool: Convert time between time zones
10
  @tool
11
  def convert_time(time_str: str, from_tz: str, to_tz: str) -> str:
@@ -46,7 +49,7 @@ def assign_alert(alert_message: str) -> str:
46
  return "Alert could not be assigned automatically. Please check manually."
47
 
48
 
49
- # Tool: Transcribe audio and generate a timeline
50
  @tool
51
  def transcribe_audio(audio_path: str) -> str:
52
  """Transcribe audio and log events with timestamps.
@@ -54,8 +57,7 @@ def transcribe_audio(audio_path: str) -> str:
54
  audio_path: Path to the audio file.
55
  """
56
  try:
57
- model = whisper.load_model("base")
58
- result = model.transcribe(audio_path)
59
  transcript = result["text"]
60
  timestamped_events = [f"{datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')} - {line}" for line in transcript.split('.')]
61
  return "\n".join(timestamped_events)
 
2
  import datetime
3
  import pytz
4
  import yaml
5
+ from transformers import pipeline
6
  from tools.final_answer import FinalAnswerTool
7
  from Gradio_UI import GradioUI
8
 
9
+ # Initialize ASR model from Hugging Face
10
+ asr_pipeline = pipeline("automatic-speech-recognition", model="facebook/wav2vec2-large-960h")
11
+
12
  # Tool: Convert time between time zones
13
  @tool
14
  def convert_time(time_str: str, from_tz: str, to_tz: str) -> str:
 
49
  return "Alert could not be assigned automatically. Please check manually."
50
 
51
 
52
+ # Tool: Transcribe audio and generate a timeline using Hugging Face ASR
53
  @tool
54
  def transcribe_audio(audio_path: str) -> str:
55
  """Transcribe audio and log events with timestamps.
 
57
  audio_path: Path to the audio file.
58
  """
59
  try:
60
+ result = asr_pipeline(audio_path)
 
61
  transcript = result["text"]
62
  timestamped_events = [f"{datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')} - {line}" for line in transcript.split('.')]
63
  return "\n".join(timestamped_events)