Spaces:

MCP-1st-Birthday
/

mlops-agent

Running

App Files Files Community

Abid Ali Awan committed 10 days ago

Commit

693bdb2

1 Parent(s): 45bd7ce

refactor: Revamp Gradio MCP Connector to enhance performance and user experience by implementing a two-phase chat process with tool resolution and streaming responses, updating the system prompt for clarity, and improving file upload handling.

Browse files

Files changed (2) hide show

app.py +130 -323
todolist.md +5 -0

app.py CHANGED Viewed

@@ -1,379 +1,186 @@
 """
-Gradio MCP Client for Remote MCP Server - With File Upload
 """
-import json
 import os
 import shutil
-import warnings
-from contextlib import asynccontextmanager
 import gradio as gr
-from fastmcp import Client
-from fastmcp.client.transports import StreamableHttpTransport
 from openai import OpenAI
-# Suppress deprecation warnings
-warnings.filterwarnings(
-    "ignore", category=DeprecationWarning, module="websockets.legacy"
-)
-warnings.filterwarnings(
-    "ignore", category=DeprecationWarning, module="uvicorn.protocols.websockets"
-)
-# Import orchestrator functions (if available)
-try:
-    from orchestrator import run_orchestrated_chat, run_orchestrated_chat_stream
-except ImportError:
-    # Fallback if orchestrator module not found
-    run_orchestrated_chat = None
-    run_orchestrated_chat_stream = None
-# Configuration
-MCP_SERVER_URL = "https://mcp-1st-birthday-auto-deployer.hf.space/gradio_api/mcp/"
 OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
-MODEL = "gpt-5-mini"
-# Will be set when app launches
-APP_URL = None
-class MCPClientManager:
-    def __init__(self, server_url: str):
-        self.server_url = server_url
-    @asynccontextmanager
-    async def get_client(self):
-        transport = StreamableHttpTransport(self.server_url)
-        async with Client(transport) as client:
-            yield client
-    async def get_tools(self) -> list:
-        async with self.get_client() as client:
-            return await client.list_tools()
-    async def call_tool(self, tool_name: str, arguments: dict) -> str:
-        async with self.get_client() as client:
-            result = await client.call_tool(tool_name, arguments)
-            if hasattr(result, "content"):
-                if isinstance(result.content, list):
-                    return "\n".join(
-                        str(item.text) if hasattr(item, "text") else str(item)
-                        for item in result.content
-                    )
-                return str(result.content)
-            return str(result)
-    def to_openai_tools(self, tools: list) -> list:
-        return [
-            {
-                "type": "function",
-                "function": {
-                    "name": tool.name,
-                    "description": tool.description or "",
-                    "parameters": {
-                        "type": "object",
-                        "properties": tool.inputSchema.get("properties", {})
-                        if tool.inputSchema
-                        else {},
-                        "required": tool.inputSchema.get("required", [])
-                        if tool.inputSchema
-                        else [],
-                    },
-                },
-            }
-            for tool in tools
-        ]
-mcp = MCPClientManager(MCP_SERVER_URL)
-openai_client = OpenAI(api_key=OPENAI_API_KEY)
-SYSTEM_PROMPT = """You are a helpful ML assistant with access to Auto Deployer tools.
-IMPORTANT: When calling tools with file_path parameter:
-- Use the provided file URL directly
-- Pass ONLY the raw URL (e.g., "https://...")
-- Never add prefixes like "Gradio File Input - "
-Always pass URLs directly without any prefix."""
-async def chat(message: str, history: list, file_url: str):
-    """Process chat with optional file URL"""
-    tools = await mcp.get_tools()
-    openai_tools = mcp.to_openai_tools(tools)
-    messages = [{"role": "system", "content": SYSTEM_PROMPT}]
-    # Add file context if available
-    user_content = message
-    if file_url:
-        user_content = f"[Uploaded CSV file URL: {file_url}]\n\n{message}"
-    # Build history
-    for item in history:
-        if isinstance(item, (list, tuple)) and len(item) == 2:
-            user_msg, assistant_msg = item
-            messages.append({"role": "user", "content": user_msg})
-            if assistant_msg:
-                messages.append({"role": "assistant", "content": assistant_msg})
-    messages.append({"role": "user", "content": user_content})
-    # First call
-    response = openai_client.chat.completions.create(
-        model=MODEL,
-        messages=messages,
-        tools=openai_tools,
-        tool_choice="auto",
-    )
-    assistant_message = response.choices[0].message
-    # Handle tool calls
-    while assistant_message.tool_calls:
-        messages.append(assistant_message)
-        yield "🔧 Calling tools...\n\n"
-        for tool_call in assistant_message.tool_calls:
-            tool_name = tool_call.function.name
-            arguments = json.loads(tool_call.function.arguments)
-            # Clean file_path
-            if "file_path" in arguments:
-                fp = arguments["file_path"]
-                if fp.startswith("Gradio File Input - "):
-                    arguments["file_path"] = fp.replace("Gradio File Input - ", "")
-            yield f"⚙️ Running `{tool_name}`...\n\n"
-            try:
-                tool_result = await mcp.call_tool(tool_name, arguments)
-            except Exception as e:
-                tool_result = f"Error: {e}"
-            messages.append(
-                {
-                    "role": "tool",
-                    "tool_call_id": tool_call.id,
-                    "content": tool_result,
-                }
-            )
-        response = openai_client.chat.completions.create(
-            model=MODEL,
-            messages=messages,
-            tools=openai_tools,
-            tool_choice="auto",
-        )
-        assistant_message = response.choices[0].message
-    # Stream final response
-    stream = openai_client.chat.completions.create(
-        model=MODEL,
-        messages=messages,
-        stream=True,
-    )
-    partial_response = ""
-    for chunk in stream:
-        if chunk.choices[0].delta.content:
-            partial_response += chunk.choices[0].delta.content
-            yield partial_response
 def handle_upload(file_obj, request: gr.Request):
-    """
-    1) Take uploaded file
-    2) Copy to /tmp for a stable path
-    3) Build a public gradio file URL
-    """
     if file_obj is None:
-        return None, None
-    # Local path where Gradio stored the file
     local_path = file_obj.name
-    # Optional: stabilize path under /tmp
     stable_path = os.path.join("/tmp", os.path.basename(local_path))
     try:
         shutil.copy(local_path, stable_path)
         local_path = stable_path
     except Exception:
-        # If copy fails, use original path
         pass
-    # Use Gradio's internal file URL format
-    base_url = str(request.base_url).rstrip('/')
-    public_url = f"{base_url}/gradio_api/file={local_path}"
-    return public_url, public_url
-async def chat_send_stream(user_msg, history, file_url):
     """
-    Streaming chat function that yields updates including tool invocations.
-    - history: list of message dictionaries with 'role' and 'content' keys
-    - file_url: required HTTP URL to the uploaded file
     """
     if history is None:
         history = []
-    # Ensure history is in proper dict format
-    messages = []
-    for item in history:
-        if isinstance(item, dict) and "role" in item and "content" in item:
-            messages.append(item)
-        elif isinstance(item, (list, tuple)) and len(item) == 2:
-            user_msg_item, assistant_msg_item = item
-            messages.append({"role": "user", "content": str(user_msg_item)})
-            if assistant_msg_item:
-                messages.append({"role": "assistant", "content": str(assistant_msg_item)})
-    # Add current user message
-    messages.append({"role": "user", "content": user_msg})
-    # Add thinking placeholder
-    messages.append({"role": "assistant", "content": "🤔 Thinking..."})
-    # If no file, respond with error
-    if not file_url:
-        messages[-1] = {"role": "assistant", "content": "Upload a file first."}
-        yield messages
-        return
-    # Use orchestrator if available
-    if run_orchestrated_chat_stream:
-        # Convert to tuple format for orchestrator (excluding current thinking message)
-        history_tuples = []
-        for item in messages[:-1]:
-            if item["role"] == "user":
-                history_tuples.append((item.get("content", ""), ""))
-            elif item["role"] == "assistant":
-                if history_tuples:
-                    history_tuples[-1] = (history_tuples[-1][0], item.get("content", ""))
-        # Stream the response using async generator
-        async for chunk in run_orchestrated_chat_stream(
-            user_msg, history_tuples, file_url
-        ):
-            chunk_type = chunk.get("type", "")
-            chunk_content = chunk.get("content", "")
-            if chunk_type == "thinking":
-                messages[-1] = {"role": "assistant", "content": chunk_content}
-                yield messages
-            elif chunk_type == "tool":
-                messages[-1] = {"role": "assistant", "content": messages[-1]["content"] + f"\n{chunk_content}"}
-                yield messages
-            elif chunk_type == "result":
-                messages[-1] = {"role": "assistant", "content": messages[-1]["content"] + f"\n{chunk_content}"}
-                yield messages
-            elif chunk_type == "final":
-                messages[-1] = {"role": "assistant", "content": chunk_content}
-                yield messages
-            elif chunk_type == "error":
-                messages[-1] = {"role": "assistant", "content": chunk_content}
-                yield messages
     else:
-        # Fallback: use the existing chat function with streaming
-        simple_history = [item for item in messages[:-1] if item["role"] in ["user", "assistant"]]
-        response_text = ""
-        async for chunk in chat(user_msg, simple_history, file_url):
-            response_text = chunk
-            messages[-1] = {"role": "assistant", "content": response_text}
-            yield messages
-with gr.Blocks(title="MCP + GPT-5 mini - Streaming Chat") as demo:
-    gr.Markdown(
-        """
-        # AI-Driven MLOps Agent 🤖
-        - **Upload a CSV file** (required)
-        - Real-time streaming with live tool invocations
-        - Get intelligent insights, training, or deployment based on your needs
-        """
     )
-    uploader = gr.File(
-        label="Required CSV file upload",
-        file_count="single",
-        type="filepath",
-        file_types=[".csv"],  # Restrict to CSV files only
-    )
-    # Internal file URL storage (hidden from UI)
-    file_url_state = gr.State(value=None)
-    # Use message format for better streaming support
-    chatbot = gr.Chatbot(
-        label="Chat",
-        avatar_images=(
-            None,
-            "https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.png",
-        ),
     )
-    msg = gr.Textbox(label="Message", interactive=True)
-    send = gr.Button("Send", interactive=True)
-    # When file changes, generate URL and update state
-    uploader.change(
-        handle_upload,
-        inputs=[uploader],
-        outputs=[file_url_state],
-    )
-    # Send button (streaming) - update chatbot and clear input
     send.click(
         chat_send_stream,
-        inputs=[msg, chatbot, file_url_state],
         outputs=[chatbot],
     ).then(lambda: "", outputs=[msg])
-    # Press Enter to send (streaming) - update chatbot and clear input
     msg.submit(
         chat_send_stream,
-        inputs=[msg, chatbot, file_url_state],
         outputs=[chatbot],
     ).then(lambda: "", outputs=[msg])
-async def test_mcp_connection():
-    """Test MCP connection on startup"""
-    try:
-        print("Testing MCP server connection...")
-        tools = await mcp.get_tools()
-        print(f"✅ Connected to MCP server. Found {len(tools)} tools.")
-        return True
-    except Exception as e:
-        print(f"❌ Failed to connect to MCP server: {e}")
-        return False
 if __name__ == "__main__":
-    import asyncio
-    import warnings
-    # Suppress all warnings for cleaner output
-    warnings.filterwarnings("ignore")
-    # Test MCP connection on startup
-    try:
-        print(f"Attempting to connect to MCP server: {MCP_SERVER_URL}")
-        asyncio.run(test_mcp_connection())
-    except Exception as e:
-        print(f"MCP connection test failed: {e}")
-        print("Continuing anyway - connection will be retried during chat...")
-    # Launch the app
     demo.queue().launch(
         allowed_paths=["/tmp"],
-        ssr_mode=False,
         show_error=True,
         quiet=True,
     )

 """
+Gradio + OpenAI MCP Connector — Clean, Fast, Streaming, With File Upload
 """
 import os
 import shutil
 import gradio as gr
 from openai import OpenAI
+# ---------------------
+# CONFIGURATION
+# ---------------------
 OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+MCP_SERVER_URL = "https://mcp-1st-birthday-auto-deployer.hf.space/gradio_api/mcp/"
+MODEL_FAST = "gpt-5-mini"  # for tool resolution
+MODEL_STREAM = "gpt-5.1"  # for final streaming reply
+client = OpenAI(api_key=OPENAI_API_KEY)
+SYSTEM_PROMPT = """
+You are a fast MLOps assistant with access to remote MCP tools.
+Use tools only when necessary.
+Keep reasoning effort LOW for speed.
+After tools run, summarize clearly and concisely.
+"""
+# ---------------------
+# NATIVE MCP CONNECTOR
+# ---------------------
+TOOLS = [
+    {
+        "type": "mcp",
+        "server_label": "deploy_tools",
+        "server_url": MCP_SERVER_URL,
+        # transport auto-detected; HF space supports HTTP
+    }
+]
+# ---------------------
+# FILE UPLOAD HANDLER
+# ---------------------
 def handle_upload(file_obj, request: gr.Request):
     if file_obj is None:
+        return None
+    # Ensure file is in a stable path
     local_path = file_obj.name
     stable_path = os.path.join("/tmp", os.path.basename(local_path))
     try:
         shutil.copy(local_path, stable_path)
         local_path = stable_path
     except Exception:
         pass
+    # Build public Gradio URL
+    base = str(request.base_url).rstrip("/")
+    return f"{base}/gradio_api/file={local_path}"
+# ---------------------
+# MAIN CHAT HANDLER
+# ---------------------
+def chat_send_stream(user_msg, history, file_url):
     """
+    2-phase pipeline:
+        PHASE 1 ➜ Non-streaming tool resolution using gpt-5-mini
+        PHASE 2 ➜ Streaming final output using gpt-5.1
     """
     if history is None:
         history = []
+    # Build message history for OpenAI
+    messages = [{"role": "system", "content": SYSTEM_PROMPT}]
+    for u, a in history:
+        messages.append({"role": "user", "content": u})
+        if a:
+            messages.append({"role": "assistant", "content": a})
+    # Inject file context
+    if file_url:
+        user_msg_full = f"[Uploaded CSV file: {file_url}]\n\n{user_msg}"
     else:
+        user_msg_full = user_msg
+    messages.append({"role": "user", "content": user_msg_full})
+    # -----------------------------
+    # PHASE 1 — TOOL RESOLUTION
+    # -----------------------------
+    tool_phase = client.responses.create(
+        model=MODEL_FAST,
+        reasoning={"effort": "low"},
+        tools=TOOLS,
+        instructions=SYSTEM_PROMPT,
+        input=messages,
     )
+    tool_feedback = []
+    # Detect tool calls (if any)
+    if tool_phase.output:
+        for item in tool_phase.output:
+            if item.type == "tool_call":
+                tool_feedback.append(f"🛠️ Used tool `{item.name}`.")
+            elif item.type == "tool_result":
+                tool_feedback.append(f"{item.content}")
+        if not tool_feedback:
+            tool_feedback.append("No MCP tools needed.")
+    else:
+        tool_feedback.append("No MCP tools needed.")
+    # Append tool results to messages before final generation
+    messages.append({"role": "assistant", "content": "\n".join(tool_feedback)})
+    # Yield intermediate tool feedback to the UI
+    history.append((user_msg, "\n".join(tool_feedback)))
+    yield history
+    # -----------------------------
+    # PHASE 2 — STREAMING FINAL ANSWER
+    # -----------------------------
+    stream = client.responses.create(
+        model=MODEL_STREAM,
+        reasoning={"effort": "low"},
+        instructions=SYSTEM_PROMPT,
+        input=messages,
+        stream=True,
     )
+    final_text = ""
+    for ev in stream:
+        if ev.type == "response.output_text.delta":
+            final_text += ev.delta
+            history[-1] = (user_msg, "\n".join(tool_feedback) + "\n\n" + final_text)
+            yield history
+        elif ev.type == "response.completed":
+            break
+    stream.close()
+# ---------------------
+# GRADIO UI
+# ---------------------
+with gr.Blocks(title="MCP + GPT-5 — Fast Streaming MLOps Agent") as demo:
+    gr.Markdown("""
+    # 🚀 AI-Driven MLOps Agent (MCP-Powered)
+    - Upload a CSV file
+    - Tools resolve instantly
+    - Final answer streams smoothly
+    """)
+    file_state = gr.State()
+    uploader = gr.File(label="Upload CSV file", type="filepath", file_count="single")
+    uploader.change(handle_upload, inputs=[uploader], outputs=[file_state])
+    chatbot = gr.Chatbot(label="Chat")
+    msg = gr.Textbox(label="Message")
+    send = gr.Button("Send")
     send.click(
         chat_send_stream,
+        inputs=[msg, chatbot, file_state],
         outputs=[chatbot],
     ).then(lambda: "", outputs=[msg])
     msg.submit(
         chat_send_stream,
+        inputs=[msg, chatbot, file_state],
         outputs=[chatbot],
     ).then(lambda: "", outputs=[msg])
 if __name__ == "__main__":
     demo.queue().launch(
         allowed_paths=["/tmp"],
         show_error=True,
         quiet=True,
     )

todolist.md ADDED Viewed

	@@ -0,0 +1,5 @@

+- [ ] Disable the message box and send button until the final response is received.
+- [ ] Reduce the thinking process during tool selection and then when analysing the dataset.
+- [ ] Clear the message box when the user sends the message.
+- [ ] The model is not taking account of previous conversations.
+- [ ] Add more info to the README.