Spaces:
Running
on
Zero
Running
on
Zero
Y Phung Nguyen
committed on
Commit
·
8515412
1
Parent(s):
9099c51
Show final answer not error msg if any
Browse files
ui.py
CHANGED
|
@@ -750,6 +750,7 @@ def create_demo():
|
|
| 750 |
request = MockRequest()
|
| 751 |
|
| 752 |
# Model is loaded, proceed with stream_chat (no model loading here to save time)
|
|
|
|
| 753 |
try:
|
| 754 |
for result in stream_chat(
|
| 755 |
message, history, system_prompt, temperature, max_new_tokens,
|
|
@@ -757,15 +758,60 @@ def create_demo():
|
|
| 757 |
use_rag, medical_model_name, use_web_search,
|
| 758 |
enable_clinical_intake, disable_agentic_reasoning, show_thoughts, request
|
| 759 |
):
|
|
|
|
| 760 |
yield result
|
| 761 |
except Exception as e:
|
| 762 |
# Handle any errors gracefully
|
| 763 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 764 |
import traceback
|
| 765 |
logger.debug(f"Full traceback: {traceback.format_exc()}")
|
| 766 |
-
|
| 767 |
-
|
| 768 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 769 |
|
| 770 |
submit_button.click(
|
| 771 |
fn=stream_chat_with_model_check,
|
|
|
|
| 750 |
request = MockRequest()
|
| 751 |
|
| 752 |
# Model is loaded, proceed with stream_chat (no model loading here to save time)
|
| 753 |
+
last_result = None
|
| 754 |
try:
|
| 755 |
for result in stream_chat(
|
| 756 |
message, history, system_prompt, temperature, max_new_tokens,
|
|
|
|
| 758 |
use_rag, medical_model_name, use_web_search,
|
| 759 |
enable_clinical_intake, disable_agentic_reasoning, show_thoughts, request
|
| 760 |
):
|
| 761 |
+
last_result = result
|
| 762 |
yield result
|
| 763 |
except Exception as e:
|
| 764 |
# Handle any errors gracefully
|
| 765 |
+
error_str = str(e)
|
| 766 |
+
error_msg_lower = error_str.lower()
|
| 767 |
+
is_gpu_timeout = 'gpu task aborted' in error_msg_lower or 'timeout' in error_msg_lower
|
| 768 |
+
|
| 769 |
+
logger.error(f"Error in stream_chat_with_model_check: {error_str}")
|
| 770 |
import traceback
|
| 771 |
logger.debug(f"Full traceback: {traceback.format_exc()}")
|
| 772 |
+
|
| 773 |
+
# Check if we have a valid answer in the last result
|
| 774 |
+
has_valid_answer = False
|
| 775 |
+
if last_result is not None:
|
| 776 |
+
try:
|
| 777 |
+
last_history, last_thoughts = last_result
|
| 778 |
+
# Find the last assistant message in the history
|
| 779 |
+
if last_history and isinstance(last_history, list):
|
| 780 |
+
for msg in reversed(last_history):
|
| 781 |
+
if isinstance(msg, dict) and msg.get("role") == "assistant":
|
| 782 |
+
assistant_content = msg.get("content", "")
|
| 783 |
+
# Check if it's a valid answer (not empty, not an error message)
|
| 784 |
+
if assistant_content and len(assistant_content.strip()) > 0:
|
| 785 |
+
# Not an error message
|
| 786 |
+
if not assistant_content.strip().startswith("⚠️") and not assistant_content.strip().startswith("⏳"):
|
| 787 |
+
has_valid_answer = True
|
| 788 |
+
break
|
| 789 |
+
except Exception as parse_error:
|
| 790 |
+
logger.debug(f"Error parsing last_result: {parse_error}")
|
| 791 |
+
|
| 792 |
+
# If we have a valid answer, use it (don't show error message)
|
| 793 |
+
if has_valid_answer:
|
| 794 |
+
logger.info(f"[UI] Error occurred but final answer already generated, displaying it without error message")
|
| 795 |
+
yield last_result
|
| 796 |
+
return
|
| 797 |
+
|
| 798 |
+
# For GPU timeouts, try to use last result even if it's partial
|
| 799 |
+
if is_gpu_timeout and last_result is not None:
|
| 800 |
+
logger.info(f"[UI] GPU timeout occurred, using last available result")
|
| 801 |
+
yield last_result
|
| 802 |
+
return
|
| 803 |
+
|
| 804 |
+
# Only show error for non-timeout errors when we have no valid answer
|
| 805 |
+
# For GPU timeouts with no result, show empty message (not error)
|
| 806 |
+
if is_gpu_timeout:
|
| 807 |
+
logger.info(f"[UI] GPU timeout with no result, showing empty assistant message")
|
| 808 |
+
updated_history = history + [{"role": "user", "content": message}, {"role": "assistant", "content": ""}]
|
| 809 |
+
yield updated_history, ""
|
| 810 |
+
else:
|
| 811 |
+
# For other errors, show minimal error message only if no result
|
| 812 |
+
error_display = f"⚠️ An error occurred: {error_str[:200]}"
|
| 813 |
+
updated_history = history + [{"role": "user", "content": message}, {"role": "assistant", "content": error_display}]
|
| 814 |
+
yield updated_history, ""
|
| 815 |
|
| 816 |
submit_button.click(
|
| 817 |
fn=stream_chat_with_model_check,
|