coquiAPI

Build error

App Files Community

anuj-exe committed on Oct 7, 2025

Commit

71348b1

verified ·

1 Parent(s): c82872c

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -31

app.py CHANGED Viewed

@@ -3,18 +3,13 @@ from TTS.api import TTS
 import time
 import os
-# ------------------ Configuration ------------------
 YOURTTS_MODEL = "tts_models/multilingual/multi-dataset/your_tts"
 FIXED_SPEAKER_PATH = "speakers/voice2.wav"
-# Initialize model once
 tts = TTS(YOURTTS_MODEL, gpu=False)
-# ------------------ Core Synthesis Function ------------------
 def synthesize(text):
     output_path = "output.wav"
     start_time = time.time()
     if not os.path.exists(FIXED_SPEAKER_PATH):
         return None, {"error": f"❌ Speaker file not found: {FIXED_SPEAKER_PATH}"}
@@ -31,7 +26,6 @@ def synthesize(text):
     total_time = time.time() - start_time
     est_duration = len(text.split()) / 2.5
     rtf = round(total_time / est_duration, 3)
     return output_path, {
         "language": "English",
         "processing_time_sec": round(total_time, 3),
@@ -40,28 +34,15 @@ def synthesize(text):
         "speaker_used": os.path.basename(FIXED_SPEAKER_PATH)
     }
-# ------------------ Gradio UI + API ------------------
-with gr.Blocks() as demo:
-    gr.Markdown("## 🗣️ YourTTS Voice Cloning (English Only, Fixed Speaker)")
-    input_text = gr.Textbox(
-        label="Text",
-        placeholder="Type something to synthesize...",
-        lines=3
-    )
-    generate_btn = gr.Button("🔊 Generate Speech")
-    output_audio = gr.Audio(label="Output Audio", type="filepath")
-    metadata_json = gr.JSON(label="Meta Info (Time, Model, RTF, etc.)")
-    # This adds both UI and API under the same app
-    generate_btn.click(
-        fn=synthesize,
-        inputs=[input_text],
-        outputs=[output_audio, metadata_json],
-        api_name="/predict"   # <- this exposes the API endpoint
-    )
-# ------------------ Launch ------------------
-demo.launch(server_name="0.0.0.0", server_port=7860, show_api=True)

 import time
 import os
 YOURTTS_MODEL = "tts_models/multilingual/multi-dataset/your_tts"
 FIXED_SPEAKER_PATH = "speakers/voice2.wav"
 tts = TTS(YOURTTS_MODEL, gpu=False)
 def synthesize(text):
     output_path = "output.wav"
     start_time = time.time()
     if not os.path.exists(FIXED_SPEAKER_PATH):
         return None, {"error": f"❌ Speaker file not found: {FIXED_SPEAKER_PATH}"}
     total_time = time.time() - start_time
     est_duration = len(text.split()) / 2.5
     rtf = round(total_time / est_duration, 3)
     return output_path, {
         "language": "English",
         "processing_time_sec": round(total_time, 3),
         "speaker_used": os.path.basename(FIXED_SPEAKER_PATH)
     }
+# ✅ Define both the UI and API on the same Interface object
+demo = gr.Interface(
+    fn=synthesize,
+    inputs=[gr.Textbox(label="Text")],
+    outputs=[gr.Audio(type="filepath"), gr.JSON()],
+    title="YourTTS Voice Cloning (English Only, Fixed Speaker)",
+    allow_flagging="never"
+)
+demo.api_name = "/predict"  # ✅ explicit API name registration
+if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860, show_api=True)