Abid Ali Awan committed
Commit 788acd9 · Parent: 84cc41e

refactor: Revise system prompts and enhance output extraction in Gradio application to improve clarity, formatting, and user interaction during data operations, while streamlining the chat response process.

Files changed (2):
  1. app.py +46 -86
  2. test_streaming.py +105 -0
app.py CHANGED
@@ -5,6 +5,7 @@ CSV-based MLOps Agent with streaming final answer & MCP tools
 
 import os
 import shutil
+import json
 
 import gradio as gr
 from openai import OpenAI
@@ -32,33 +33,28 @@ MCP_TOOLS = [
 # Short prompts
 # -------------------------
 
-TOOL_SYSTEM_PROMPT = """
-You are an MLOps assistant with MCP tools for CSV analysis, training,
+MAIN_SYSTEM_PROMPT = """
+You are a helpful MLOps assistant with MCP tools for CSV analysis, training,
 evaluation, and deployment.
 
-If the user asks about data, datasets, CSVs, models, training,
-evaluation, or deployment, call MCP tools instead of guessing.
+For data-related requests (datasets, CSVs, models, training, evaluation,
+deployment), call MCP tools to get comprehensive natural language results.
+The tools will return detailed explanations you can share directly.
 
-Use the CSV file URL exactly as given when tools need a file path.
-Do not invent tool names or parameters.
-Keep internal reasoning hidden and reply briefly with technical details.
-"""
+For general chat (no data operations), respond helpfully and naturally.
 
-FINAL_SYSTEM_PROMPT = """
-You are a helpful MLOps explainer and general assistant.
+When using tools:
+- Use the CSV file URL exactly as provided
+- Do not invent tool parameters
+- Share the complete results from MCP tools
+- Add brief context or suggestions if helpful
 
-You see the conversation plus a short technical summary of what tools did
-(if any). Explain in simple language what was done and what the results mean.
-Mention key metrics, model IDs, or endpoints if available.
-Suggest next steps briefly. For normal chat (no tools), just respond helpfully.
+Keep responses clear, informative, and user-friendly.
 
 Formatting rules:
-- Use Markdown.
-- Use bullet points for lists.
-- Wrap any commands or code (curl, bash, Python, JSON) in fenced code blocks:
-```bash
-...
-```
+- Use Markdown for formatting
+- Use bullet points for lists
+- Wrap code, commands, and JSON in fenced code blocks
 """
 
 
@@ -87,21 +83,26 @@ def history_to_text(history) -> str:
 
 def extract_output_text(response) -> str:
     """
-    Extract plain text from a non-streaming Responses API call.
-    Fallback gracefully if the shape is unexpected.
+    Extract text from a non-streaming Responses API call while preserving formatting.
     """
     try:
-        if response.output and len(response.output) > 0:
+        if hasattr(response, 'output') and response.output and len(response.output) > 0:
             first = response.output[0]
             if getattr(first, "content", None):
-                c0 = first.content[0]
-                text = getattr(c0, "text", None)
-                if text:
-                    return text
+                for content_item in first.content:
+                    if hasattr(content_item, 'type') and content_item.type == "output_text":
+                        text = getattr(content_item, "text", None)
+                        if text:
+                            return text
+                    elif hasattr(content_item, 'type') and content_item.type == "output_json":
+                        # If there's JSON output, format it nicely
+                        json_data = getattr(content_item, 'json', None)
+                        if json_data:
+                            return f"```json\n{json.dumps(json_data, indent=2)}\n```"
         # Fallback
-        return getattr(response, "output_text", None) or str(response)
-    except Exception:
-        return str(response)
+        return getattr(response, 'output_text', None) or str(response)
+    except Exception as e:
+        return f"Error extracting output: {e}"
 
 
 def handle_upload(file_path, request: gr.Request):
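
For orientation, a minimal sketch (not part of the commit) of what the rewritten extract_output_text does. The SimpleNamespace values are hypothetical stand-ins shaped only as far as the function actually reads them, and importing from app assumes app.py imports cleanly (it constructs the OpenAI client at import time, so credentials must be configured):

```python
from types import SimpleNamespace

from app import extract_output_text  # assumes app.py is importable

# Stand-in mimicking response.output[0].content[0] with type "output_text".
text_item = SimpleNamespace(type="output_text", text="Dataset has 303 rows.")
fake_response = SimpleNamespace(output=[SimpleNamespace(content=[text_item])])

# The function now walks every content item instead of only the first,
# returns output_text items verbatim, and renders output_json items as a
# fenced JSON block via json.dumps.
print(extract_output_text(fake_response))  # -> Dataset has 303 rows.
```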
@@ -164,9 +165,8 @@ def chat_send_stream(user_msg, history, file_url):
 
     - If the user is just chatting (e.g., "hey"), respond directly
       with a streaming answer (no tools, no CSV required).
-    - If the user clearly asks for data/model operations, run:
-      Phase 1: non-stream tool phase via Responses API + MCP tools
-      Phase 2: streaming final answer via Responses API (no tools)
+    - If the user clearly asks for data/model operations:
+      Call API once with MCP tools and stream the natural language results directly
     - Keeps full chat history so follow-ups work.
     - Shows status/progress messages in the UI when tools are used.
     - Disables the textbox during work, re-enables at the end.
@@ -190,7 +190,7 @@ def chat_send_stream(user_msg, history, file_url):
     # -------------------------
     if not use_tools:
         # Add a small status bubble then stream
-        history.append({"role": "assistant", "content": "✏️ Generating answer..."})
+        history.append({"role": "assistant", "content": "Generating answer..."})
         # Disable textbox while generating
         yield (
             history,
@@ -206,7 +206,7 @@ def chat_send_stream(user_msg, history, file_url):
 
         stream = client.responses.create(
             model=MODEL,
-            instructions=FINAL_SYSTEM_PROMPT,
+            instructions=MAIN_SYSTEM_PROMPT,
             input=input_text,
             reasoning={"effort": "low"},
             stream=True,
@@ -256,15 +256,11 @@ def chat_send_stream(user_msg, history, file_url):
     # User message for the model includes the CSV URL
     user_with_file = f"[Uploaded CSV file URL: {file_url}]\n\n{user_msg}"
 
-    # -------------------------
-    # Phase 1: Tool + technical summary (non-streaming)
-    # -------------------------
-
     # Show a status message in UI
     history.append(
         {
             "role": "assistant",
-            "content": "Analyzing your request and selecting MCP tools...",
+            "content": "Analyzing your request and running MCP tools...",
         }
     )
     # Disable textbox while tools run
@@ -273,63 +269,26 @@ def chat_send_stream(user_msg, history, file_url):
         gr.update(interactive=False),
     )
 
-    # Build a single string input for the tool phase
-    tool_phase_input = (
+    # Build input for the tool phase (single call)
+    tool_input = (
         (f"Conversation so far:\n{convo_before}\n\n" if convo_before else "")
         + "Latest user request (with file URL):\n"
         + user_with_file
-        + "\n\nYour task: decide which MCP tools to call and run them. "
-        "Then return a short technical summary of what you did and what the tools returned."
     )
 
-    tool_phase = client.responses.create(
+    # Single API call with tools - MCP returns natural language results
+    stream = client.responses.create(
         model=MODEL,
-        instructions=TOOL_SYSTEM_PROMPT,
-        input=tool_phase_input,
+        instructions=MAIN_SYSTEM_PROMPT,
+        input=tool_input,
         tools=MCP_TOOLS,
         reasoning={"effort": "low"},
+        stream=True,
     )
 
-    scratchpad = extract_output_text(tool_phase).strip()
-    if not scratchpad:
-        scratchpad = "No MCP tool output was returned."
-
-    # Update status message to show tools finished
-    history[-1] = {
-        "role": "assistant",
-        "content": "✅ MCP tools finished. Preparing explanation...",
-    }
-    # Keep textbox disabled (we're about to stream final answer)
-    yield (
-        history,
-        gr.update(interactive=False),
-    )
-
-    # -------------------------
-    # Phase 2: Final streaming explanation
-    # -------------------------
-
-    # Replace last assistant message with streaming answer
+    # Replace status message with streaming answer
     history[-1] = {"role": "assistant", "content": ""}
 
-    # Build a single string input for the final explanation phase
-    final_input = (
-        (f"Conversation so far:\n{convo_before}\n\n" if convo_before else "")
-        + "Latest user request (with file URL):\n"
-        + user_with_file
-        + "\n\nTechnical summary of tool actions and results:\n"
-        + scratchpad
-        + "\n\nNow explain this clearly to the user."
-    )
-
-    stream = client.responses.create(
-        model=MODEL,
-        instructions=FINAL_SYSTEM_PROMPT,
-        input=final_input,
-        reasoning={"effort": "low"},
-        stream=True,
-    )
-
     final_text = ""
     for event in stream:
         if event.type == "response.output_text.delta":
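
One pattern worth noting in this hunk: chat_send_stream is a generator, and Gradio re-renders the UI after every yield. A self-contained sketch of that pattern (illustrative names only, with canned tokens standing in for real API deltas):

```python
import gradio as gr

def stream_reply(user_msg, history):
    # Generator event handler: each yield pushes a (chatbot, textbox) update.
    history = history + [{"role": "user", "content": user_msg}]
    history.append({"role": "assistant", "content": ""})
    for token in ["Hello", ", ", "world", "!"]:  # stand-in for stream deltas
        history[-1]["content"] += token
        yield history, gr.update(interactive=False)  # keep the textbox locked
    yield history, gr.update(interactive=True)  # re-enable when done
```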
@@ -382,6 +341,7 @@ with gr.Blocks(title="Streaming MLOps Agent") as demo:
     chatbot = gr.Chatbot(
         label="Chat",
         render_markdown=True,
+        height=500,
         avatar_images=(
             None,
             "https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.png",
@@ -403,7 +363,7 @@ with gr.Blocks(title="Streaming MLOps Agent") as demo:
 
 if __name__ == "__main__":
     demo.queue().launch(
-        theme=gr.themes.Default(primary_hue="blue", secondary_hue="green"),
+        theme=gr.themes.Soft(primary_hue="red", secondary_hue="pink"),
         allowed_paths=["/tmp"],
         ssr_mode=False,
         show_error=True,
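
A hedged note on this last hunk: in the Gradio versions I am aware of, theme is a constructor argument of gr.Blocks rather than of launch(), so the keyword here may be rejected or silently ignored depending on the installed version. A sketch of the conventional placement:

```python
with gr.Blocks(
    title="Streaming MLOps Agent",
    theme=gr.themes.Soft(primary_hue="red", secondary_hue="pink"),
) as demo:
    ...  # UI definition as above

demo.queue().launch(
    allowed_paths=["/tmp"],
    ssr_mode=False,
    show_error=True,
)
```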
 
test_streaming.py ADDED
@@ -0,0 +1,105 @@
+#!/usr/bin/env python3
+"""
+Test the optimized single-phase streaming functionality
+"""
+
+import os
+import sys
+sys.path.append(os.path.dirname(os.path.abspath(__file__)))
+
+from app import MAIN_SYSTEM_PROMPT, MCP_TOOLS, client, MODEL
+
+def test_streaming_with_tools():
+    """
+    Test that the single-phase streaming works correctly
+    """
+    csv_url = "https://mcp-1st-birthday-mlops-agent.hf.space/gradio_api/file=/tmp/gradio/6abcca54f954f2ad99a8f8f330dc6e8082f03ef3090458d97c274efcc76d0170/heart.csv"
+
+    user_with_file = f"[Uploaded CSV file URL: {csv_url}]\n\nAnalyze this dataset and show me basic statistics"
+
+    print("Testing Single-Phase Streaming...")
+    print(f"Input: {user_with_file[:100]}...")
+    print("-" * 60)
+
+    stream = client.responses.create(
+        model=MODEL,
+        instructions=MAIN_SYSTEM_PROMPT,
+        input=user_with_file,
+        tools=MCP_TOOLS,
+        reasoning={"effort": "low"},
+        stream=True,
+    )
+
+    print("Streaming Response:")
+    print("=" * 60)
+
+    final_text = ""
+    chunk_count = 0
+
+    for event in stream:
+        if event.type == "response.output_text.delta":
+            chunk_count += 1
+            final_text += event.delta
+            print(f"[Chunk {chunk_count}] {event.delta[:50]}...")
+        elif event.type == "response.completed":
+            print("=" * 60)
+            print(f"Total chunks: {chunk_count}")
+            print(f"Total length: {len(final_text)} characters")
+            print("FINAL RESPONSE:")
+            print(final_text)
+            break
+
+    return final_text
+
+def test_streaming_without_tools():
+    """
+    Test that regular streaming works for non-tool requests
+    """
+    print("\nTesting Regular Streaming (No Tools)...")
+    print("-" * 60)
+
+    stream = client.responses.create(
+        model=MODEL,
+        instructions=MAIN_SYSTEM_PROMPT,
+        input="Hello! Can you explain what MLOps is in simple terms?",
+        reasoning={"effort": "low"},
+        stream=True,
+    )
+
+    print("Streaming Response:")
+    print("=" * 60)
+
+    final_text = ""
+    chunk_count = 0
+
+    for event in stream:
+        if event.type == "response.output_text.delta":
+            chunk_count += 1
+            final_text += event.delta
+            print(f"[Chunk {chunk_count}] {event.delta[:50]}...")
+        elif event.type == "response.completed":
+            print("=" * 60)
+            print(f"Total chunks: {chunk_count}")
+            print(f"Total length: {len(final_text)} characters")
+            print("FINAL RESPONSE:")
+            print(final_text)
+            break
+
+    return final_text
+
+if __name__ == "__main__":
+    print("Starting Streaming Tests")
+    print("=" * 60)
+
+    # Test 1: With MCP tools
+    response1 = test_streaming_with_tools()
+
+    # Test 2: Without tools
+    response2 = test_streaming_without_tools()
+
+    print("\n" + "=" * 60)
+    print("✅ Both streaming tests completed successfully!")
+    print("✅ Single-phase approach working correctly!")
+    print("✅ MCP tools returning natural language responses!")
+    print("✅ Response is properly streaming in chunks!")
+    print("=" * 60)
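
The script runs directly with python test_streaming.py, given the same environment app.py expects (API credentials and network access to the MCP server). One caveat: the ✅ banner prints unconditionally, so a run "passes" even if a stream yields nothing. A stricter ending (a sketch, not part of the commit) would assert on the accumulated text:

```python
# Hypothetical replacement for the unconditional banner: fail loudly when
# either stream produced no output text.
assert response1.strip(), "tool-phase stream returned no text"
assert response2.strip(), "no-tool stream returned no text"
print("✅ Both streaming tests produced non-empty output")
```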