Spaces:

MCP-1st-Birthday
/

MedLLM-Agent

Running on Zero

App Files Community

Y Phung Nguyen committed 15 days ago

Commit

ef40fb8

1 Parent(s): d99bfd8

Fix TTS player

Browse files

Files changed (1) hide show

ui.py +23 -7

ui.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Gradio UI setup"""
 import time
 import gradio as gr
 import spaces
@@ -112,24 +113,39 @@ def create_demo():
                     outputs=[recording_timer, message_input]
                 )
-                with gr.Row(visible=False) as tts_row:
-                    tts_text = gr.Textbox(visible=False)
-                    tts_audio = gr.Audio(label="Generated Speech", visible=False)
                 def generate_speech_from_chat(history):
                     """Extract last assistant message and generate speech"""
                     if not history or len(history) == 0:
                         return None
                     last_msg = history[-1]
                     if last_msg.get("role") == "assistant":
                         text = last_msg.get("content", "").replace(" 🔊", "").strip()
                         if text:
-                            audio_path = generate_speech(text)
-                            return audio_path
                     return None
-                tts_button = gr.Button("🔊 Play Response", visible=False, size="sm")
                 def update_tts_button(history):
                     if history and len(history) > 0 and history[-1].get("role") == "assistant":
                         return gr.update(visible=True)

 """Gradio UI setup"""
+import os
 import time
 import gradio as gr
 import spaces
                     outputs=[recording_timer, message_input]
                 )
+                with gr.Row():
+                    tts_button = gr.Button("🔊 Play Response", visible=False, size="sm")
+                    tts_audio = gr.Audio(label="", visible=True, autoplay=True, show_label=False, container=False)
                 def generate_speech_from_chat(history):
                     """Extract last assistant message and generate speech"""
                     if not history or len(history) == 0:
+                        logger.warning("[TTS] No history available")
                         return None
                     last_msg = history[-1]
                     if last_msg.get("role") == "assistant":
                         text = last_msg.get("content", "").replace(" 🔊", "").strip()
                         if text:
+                            logger.info(f"[TTS] Generating speech for text: {text[:100]}...")
+                            try:
+                                audio_path = generate_speech(text)
+                                if audio_path and os.path.exists(audio_path):
+                                    logger.info(f"[TTS] ✅ Generated audio successfully: {audio_path}")
+                                    return audio_path
+                                else:
+                                    logger.warning(f"[TTS] ❌ Failed to generate audio or file doesn't exist: {audio_path}")
+                                    return None
+                            except Exception as e:
+                                logger.error(f"[TTS] Error generating speech: {e}")
+                                import traceback
+                                logger.debug(f"[TTS] Traceback: {traceback.format_exc()}")
+                                return None
+                        else:
+                            logger.warning("[TTS] Empty text extracted from assistant message")
+                    else:
+                        logger.warning(f"[TTS] Last message is not from assistant: {last_msg.get('role')}")
                     return None
                 def update_tts_button(history):
                     if history and len(history) > 0 and history[-1].get("role") == "assistant":
                         return gr.update(visible=True)