burtenshaw (HF Staff) committed
Commit ab1b163 · 1 Parent(s): b569680

Upload folder using huggingface_hub
backend/__init__.py ADDED
@@ -0,0 +1 @@
+ """LLM Council backend package."""
backend/__pycache__/__init__.cpython-310.pyc ADDED
Binary file (180 Bytes)
backend/__pycache__/config.cpython-310.pyc ADDED
Binary file (549 Bytes)
backend/__pycache__/council.cpython-310.pyc ADDED
Binary file (8.46 kB)
backend/__pycache__/debug_models.cpython-310.pyc ADDED
Binary file (883 Bytes)
backend/__pycache__/openrouter.cpython-310.pyc ADDED
Binary file (2.46 kB)
backend/config.py ADDED
@@ -0,0 +1,26 @@
+ """Configuration for the LLM Council."""
+
+ import os
+ from dotenv import load_dotenv
+
+ load_dotenv()
+
+ # OpenRouter API key
+ OPENROUTER_API_KEY = os.getenv("OPENROUTER_API_KEY")
+
+ # Council members - list of OpenRouter model identifiers
+ COUNCIL_MODELS = [
+     "openai/gpt-5.1",
+     "google/gemini-3-pro-preview",
+     "anthropic/claude-sonnet-4.5",
+     "x-ai/grok-4",
+ ]
+
+ # Chairman model - synthesizes final response
+ CHAIRMAN_MODEL = "google/gemini-3-pro-preview"
+
+ # OpenRouter API endpoint
+ OPENROUTER_API_URL = "https://openrouter.ai/api/v1/chat/completions"
+
+ # Data directory for conversation storage
+ DATA_DIR = "data/conversations"
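
config.py loads the API key via load_dotenv() but nothing in this commit validates it. A minimal sanity-check sketch, assuming it runs from the repository root with a .env file present (the script name and printout are illustrative, not part of the commit):

    # check_config.py - hypothetical helper, not part of this commit
    from backend import config

    if config.OPENROUTER_API_KEY is None:
        raise SystemExit("OPENROUTER_API_KEY is missing; add it to .env or the environment")
    print(f"{len(config.COUNCIL_MODELS)} council models, chairman: {config.CHAIRMAN_MODEL}")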
backend/council.py ADDED
@@ -0,0 +1,335 @@
+ """3-stage LLM Council orchestration."""
+
+ from typing import List, Dict, Any, Tuple
+ from .openrouter import query_models_parallel, query_model
+ from .config import COUNCIL_MODELS, CHAIRMAN_MODEL
+
+
+ async def stage1_collect_responses(user_query: str) -> List[Dict[str, Any]]:
+     """
+     Stage 1: Collect individual responses from all council models.
+
+     Args:
+         user_query: The user's question
+
+     Returns:
+         List of dicts with 'model' and 'response' keys
+     """
+     messages = [{"role": "user", "content": user_query}]
+
+     # Query all models in parallel
+     responses = await query_models_parallel(COUNCIL_MODELS, messages)
+
+     # Format results
+     stage1_results = []
+     for model, response in responses.items():
+         if response is not None:  # Only include successful responses
+             stage1_results.append({
+                 "model": model,
+                 "response": response.get('content', '')
+             })
+
+     return stage1_results
+
+
+ async def stage2_collect_rankings(
+     user_query: str,
+     stage1_results: List[Dict[str, Any]]
+ ) -> Tuple[List[Dict[str, Any]], Dict[str, str]]:
+     """
+     Stage 2: Each model ranks the anonymized responses.
+
+     Args:
+         user_query: The original user query
+         stage1_results: Results from Stage 1
+
+     Returns:
+         Tuple of (rankings list, label_to_model mapping)
+     """
+     # Create anonymized labels for responses (Response A, Response B, etc.)
+     labels = [chr(65 + i) for i in range(len(stage1_results))]  # A, B, C, ...
+
+     # Create mapping from label to model name
+     label_to_model = {
+         f"Response {label}": result['model']
+         for label, result in zip(labels, stage1_results)
+     }
+
+     # Build the ranking prompt
+     responses_text = "\n\n".join([
+         f"Response {label}:\n{result['response']}"
+         for label, result in zip(labels, stage1_results)
+     ])
+
+     ranking_prompt = f"""You are evaluating different responses to the following question:
+
+ Question: {user_query}
+
+ Here are the responses from different models (anonymized):
+
+ {responses_text}
+
+ Your task:
+ 1. First, evaluate each response individually. For each response, explain what it does well and what it does poorly.
+ 2. Then, at the very end of your response, provide a final ranking.
+
+ IMPORTANT: Your final ranking MUST be formatted EXACTLY as follows:
+ - Start with the line "FINAL RANKING:" (all caps, with colon)
+ - Then list the responses from best to worst as a numbered list
+ - Each line should be: number, period, space, then ONLY the response label (e.g., "1. Response A")
+ - Do not add any other text or explanations in the ranking section
+
+ Example of the correct format for your ENTIRE response:
+
+ Response A provides good detail on X but misses Y...
+ Response B is accurate but lacks depth on Z...
+ Response C offers the most comprehensive answer...
+
+ FINAL RANKING:
+ 1. Response C
+ 2. Response A
+ 3. Response B
+
+ Now provide your evaluation and ranking:"""
+
+     messages = [{"role": "user", "content": ranking_prompt}]
+
+     # Get rankings from all council models in parallel
+     responses = await query_models_parallel(COUNCIL_MODELS, messages)
+
+     # Format results
+     stage2_results = []
+     for model, response in responses.items():
+         if response is not None:
+             full_text = response.get('content', '')
+             parsed = parse_ranking_from_text(full_text)
+             stage2_results.append({
+                 "model": model,
+                 "ranking": full_text,
+                 "parsed_ranking": parsed
+             })
+
+     return stage2_results, label_to_model
+
+
+ async def stage3_synthesize_final(
+     user_query: str,
+     stage1_results: List[Dict[str, Any]],
+     stage2_results: List[Dict[str, Any]]
+ ) -> Dict[str, Any]:
+     """
+     Stage 3: Chairman synthesizes final response.
+
+     Args:
+         user_query: The original user query
+         stage1_results: Individual model responses from Stage 1
+         stage2_results: Rankings from Stage 2
+
+     Returns:
+         Dict with 'model' and 'response' keys
+     """
+     # Build comprehensive context for chairman
+     stage1_text = "\n\n".join([
+         f"Model: {result['model']}\nResponse: {result['response']}"
+         for result in stage1_results
+     ])
+
+     stage2_text = "\n\n".join([
+         f"Model: {result['model']}\nRanking: {result['ranking']}"
+         for result in stage2_results
+     ])
+
+     chairman_prompt = f"""You are the Chairman of an LLM Council. Multiple AI models have provided responses to a user's question, and then ranked each other's responses.
+
+ Original Question: {user_query}
+
+ STAGE 1 - Individual Responses:
+ {stage1_text}
+
+ STAGE 2 - Peer Rankings:
+ {stage2_text}
+
+ Your task as Chairman is to synthesize all of this information into a single, comprehensive, accurate answer to the user's original question. Consider:
+ - The individual responses and their insights
+ - The peer rankings and what they reveal about response quality
+ - Any patterns of agreement or disagreement
+
+ Provide a clear, well-reasoned final answer that represents the council's collective wisdom:"""
+
+     messages = [{"role": "user", "content": chairman_prompt}]
+
+     # Query the chairman model
+     response = await query_model(CHAIRMAN_MODEL, messages)
+
+     if response is None:
+         # Fallback if chairman fails
+         return {
+             "model": CHAIRMAN_MODEL,
+             "response": "Error: Unable to generate final synthesis."
+         }
+
+     return {
+         "model": CHAIRMAN_MODEL,
+         "response": response.get('content', '')
+     }
+
+
+ def parse_ranking_from_text(ranking_text: str) -> List[str]:
+     """
+     Parse the FINAL RANKING section from the model's response.
+
+     Args:
+         ranking_text: The full text response from the model
+
+     Returns:
+         List of response labels in ranked order
+     """
+     import re
+
+     # Look for "FINAL RANKING:" section
+     if "FINAL RANKING:" in ranking_text:
+         # Extract everything after "FINAL RANKING:"
+         parts = ranking_text.split("FINAL RANKING:")
+         if len(parts) >= 2:
+             ranking_section = parts[1]
+             # Try to extract numbered list format (e.g., "1. Response A")
+             # This pattern looks for: number, period, optional space, "Response X"
+             numbered_matches = re.findall(r'\d+\.\s*Response [A-Z]', ranking_section)
+             if numbered_matches:
+                 # Extract just the "Response X" part
+                 return [re.search(r'Response [A-Z]', m).group() for m in numbered_matches]
+
+             # Fallback: Extract all "Response X" patterns in order
+             matches = re.findall(r'Response [A-Z]', ranking_section)
+             return matches
+
+     # Fallback: try to find any "Response X" patterns in order
+     matches = re.findall(r'Response [A-Z]', ranking_text)
+     return matches
+
+
+ def calculate_aggregate_rankings(
+     stage2_results: List[Dict[str, Any]],
+     label_to_model: Dict[str, str]
+ ) -> List[Dict[str, Any]]:
+     """
+     Calculate aggregate rankings across all models.
+
+     Args:
+         stage2_results: Rankings from each model
+         label_to_model: Mapping from anonymous labels to model names
+
+     Returns:
+         List of dicts with model name and average rank, sorted best to worst
+     """
+     from collections import defaultdict
+
+     # Track positions for each model
+     model_positions = defaultdict(list)
+
+     for ranking in stage2_results:
+         ranking_text = ranking['ranking']
+
+         # Parse the ranking from the structured format
+         parsed_ranking = parse_ranking_from_text(ranking_text)
+
+         for position, label in enumerate(parsed_ranking, start=1):
+             if label in label_to_model:
+                 model_name = label_to_model[label]
+                 model_positions[model_name].append(position)
+
+     # Calculate average position for each model
+     aggregate = []
+     for model, positions in model_positions.items():
+         if positions:
+             avg_rank = sum(positions) / len(positions)
+             aggregate.append({
+                 "model": model,
+                 "average_rank": round(avg_rank, 2),
+                 "rankings_count": len(positions)
+             })
+
+     # Sort by average rank (lower is better)
+     aggregate.sort(key=lambda x: x['average_rank'])
+
+     return aggregate
+
+
+ async def generate_conversation_title(user_query: str) -> str:
+     """
+     Generate a short title for a conversation based on the first user message.
+
+     Args:
+         user_query: The first user message
+
+     Returns:
+         A short title (3-5 words)
+     """
+     title_prompt = f"""Generate a very short title (3-5 words maximum) that summarizes the following question.
+ The title should be concise and descriptive. Do not use quotes or punctuation in the title.
+
+ Question: {user_query}
+
+ Title:"""
+
+     messages = [{"role": "user", "content": title_prompt}]
+
+     # Use gemini-2.5-flash for title generation (fast and cheap)
+     response = await query_model("google/gemini-2.5-flash", messages, timeout=30.0)
+
+     if response is None:
+         # Fallback to a generic title
+         return "New Conversation"
+
+     title = response.get('content', 'New Conversation').strip()
+
+     # Clean up the title - remove quotes, limit length
+     title = title.strip('"\'')
+
+     # Truncate if too long
+     if len(title) > 50:
+         title = title[:47] + "..."
+
+     return title
+
+
+ async def run_full_council(user_query: str) -> Tuple[List, List, Dict, Dict]:
+     """
+     Run the complete 3-stage council process.
+
+     Args:
+         user_query: The user's question
+
+     Returns:
+         Tuple of (stage1_results, stage2_results, stage3_result, metadata)
+     """
+     # Stage 1: Collect individual responses
+     stage1_results = await stage1_collect_responses(user_query)
+
+     # If no models responded successfully, return error
+     if not stage1_results:
+         return [], [], {
+             "model": "error",
+             "response": "All models failed to respond. Please try again."
+         }, {}
+
+     # Stage 2: Collect rankings
+     stage2_results, label_to_model = await stage2_collect_rankings(user_query, stage1_results)
+
+     # Calculate aggregate rankings
+     aggregate_rankings = calculate_aggregate_rankings(stage2_results, label_to_model)
+
+     # Stage 3: Synthesize final answer
+     stage3_result = await stage3_synthesize_final(
+         user_query,
+         stage1_results,
+         stage2_results
+     )
+
+     # Prepare metadata
+     metadata = {
+         "label_to_model": label_to_model,
+         "aggregate_rankings": aggregate_rankings
+     }
+
+     return stage1_results, stage2_results, stage3_result, metadata
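
parse_ranking_from_text is the fragile joint in the pipeline: it relies on models honoring the FINAL RANKING format, with a looser label scan as a fallback. A small sketch of both paths (the inputs are made up for illustration):

    from backend.council import parse_ranking_from_text

    # Well-formed reply: the numbered list after "FINAL RANKING:" wins.
    well_formed = "Response B is weak...\n\nFINAL RANKING:\n1. Response A\n2. Response B"
    assert parse_ranking_from_text(well_formed) == ["Response A", "Response B"]

    # Free-form reply: the fallback scans for labels in order of appearance.
    free_form = "I prefer Response B over Response A."
    assert parse_ranking_from_text(free_form) == ["Response B", "Response A"]

Note that the fallback can also pick up labels a model merely mentions while discussing the responses, so aggregate ranks built from it are noisier; the rankings_count field from calculate_aggregate_rankings helps flag how many usable rankings backed each average.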
backend/debug_models.py ADDED
@@ -0,0 +1,24 @@
+
+ import asyncio
+ import os
+ from backend.openrouter import query_model
+ from backend.config import COUNCIL_MODELS
+
+ async def test_models():
+     print("Testing OpenRouter connection...")
+     print(f"API Key present: {'Yes' if os.getenv('OPENROUTER_API_KEY') else 'No'}")
+
+     messages = [{"role": "user", "content": "Say hello!"}]
+
+     for model in COUNCIL_MODELS:
+         print(f"\nTesting model: {model}")
+         response = await query_model(model, messages, timeout=30.0)
+         if response:
+             print("✅ Success!")
+             print(f"Response: {(response.get('content') or '')[:50]}...")  # content can be None
+         else:
+             print("❌ Failed")
+
+ if __name__ == "__main__":
+     asyncio.run(test_models())
+
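
Because debug_models.py imports backend.openrouter and backend.config absolutely rather than relatively, it is presumably meant to be run as a module from the repository root, e.g. "python -m backend.debug_models", with the .env file in place.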
backend/main.py ADDED
@@ -0,0 +1,199 @@
+ """FastAPI backend for LLM Council."""
+
+ from fastapi import FastAPI, HTTPException
+ from fastapi.middleware.cors import CORSMiddleware
+ from fastapi.responses import StreamingResponse
+ from pydantic import BaseModel
+ from typing import List, Dict, Any
+ import uuid
+ import json
+ import asyncio
+
+ from . import storage
+ from .council import run_full_council, generate_conversation_title, stage1_collect_responses, stage2_collect_rankings, stage3_synthesize_final, calculate_aggregate_rankings
+
+ app = FastAPI(title="LLM Council API")
+
+ # Enable CORS for local development
+ app.add_middleware(
+     CORSMiddleware,
+     allow_origins=["http://localhost:5173", "http://localhost:3000"],
+     allow_credentials=True,
+     allow_methods=["*"],
+     allow_headers=["*"],
+ )
+
+
+ class CreateConversationRequest(BaseModel):
+     """Request to create a new conversation."""
+     pass
+
+
+ class SendMessageRequest(BaseModel):
+     """Request to send a message in a conversation."""
+     content: str
+
+
+ class ConversationMetadata(BaseModel):
+     """Conversation metadata for list view."""
+     id: str
+     created_at: str
+     title: str
+     message_count: int
+
+
+ class Conversation(BaseModel):
+     """Full conversation with all messages."""
+     id: str
+     created_at: str
+     title: str
+     messages: List[Dict[str, Any]]
+
+
+ @app.get("/")
+ async def root():
+     """Health check endpoint."""
+     return {"status": "ok", "service": "LLM Council API"}
+
+
+ @app.get("/api/conversations", response_model=List[ConversationMetadata])
+ async def list_conversations():
+     """List all conversations (metadata only)."""
+     return storage.list_conversations()
+
+
+ @app.post("/api/conversations", response_model=Conversation)
+ async def create_conversation(request: CreateConversationRequest):
+     """Create a new conversation."""
+     conversation_id = str(uuid.uuid4())
+     conversation = storage.create_conversation(conversation_id)
+     return conversation
+
+
+ @app.get("/api/conversations/{conversation_id}", response_model=Conversation)
+ async def get_conversation(conversation_id: str):
+     """Get a specific conversation with all its messages."""
+     conversation = storage.get_conversation(conversation_id)
+     if conversation is None:
+         raise HTTPException(status_code=404, detail="Conversation not found")
+     return conversation
+
+
+ @app.post("/api/conversations/{conversation_id}/message")
+ async def send_message(conversation_id: str, request: SendMessageRequest):
+     """
+     Send a message and run the 3-stage council process.
+     Returns the complete response with all stages.
+     """
+     # Check if conversation exists
+     conversation = storage.get_conversation(conversation_id)
+     if conversation is None:
+         raise HTTPException(status_code=404, detail="Conversation not found")
+
+     # Check if this is the first message
+     is_first_message = len(conversation["messages"]) == 0
+
+     # Add user message
+     storage.add_user_message(conversation_id, request.content)
+
+     # If this is the first message, generate a title
+     if is_first_message:
+         title = await generate_conversation_title(request.content)
+         storage.update_conversation_title(conversation_id, title)
+
+     # Run the 3-stage council process
+     stage1_results, stage2_results, stage3_result, metadata = await run_full_council(
+         request.content
+     )
+
+     # Add assistant message with all stages
+     storage.add_assistant_message(
+         conversation_id,
+         stage1_results,
+         stage2_results,
+         stage3_result
+     )
+
+     # Return the complete response with metadata
+     return {
+         "stage1": stage1_results,
+         "stage2": stage2_results,
+         "stage3": stage3_result,
+         "metadata": metadata
+     }
+
+
+ @app.post("/api/conversations/{conversation_id}/message/stream")
+ async def send_message_stream(conversation_id: str, request: SendMessageRequest):
+     """
+     Send a message and stream the 3-stage council process.
+     Returns Server-Sent Events as each stage completes.
+     """
+     # Check if conversation exists
+     conversation = storage.get_conversation(conversation_id)
+     if conversation is None:
+         raise HTTPException(status_code=404, detail="Conversation not found")
+
+     # Check if this is the first message
+     is_first_message = len(conversation["messages"]) == 0
+
+     async def event_generator():
+         try:
+             # Add user message
+             storage.add_user_message(conversation_id, request.content)
+
+             # Start title generation in parallel (don't await yet)
+             title_task = None
+             if is_first_message:
+                 title_task = asyncio.create_task(generate_conversation_title(request.content))
+
+             # Stage 1: Collect responses
+             yield f"data: {json.dumps({'type': 'stage1_start'})}\n\n"
+             stage1_results = await stage1_collect_responses(request.content)
+             yield f"data: {json.dumps({'type': 'stage1_complete', 'data': stage1_results})}\n\n"
+
+             # Stage 2: Collect rankings
+             yield f"data: {json.dumps({'type': 'stage2_start'})}\n\n"
+             stage2_results, label_to_model = await stage2_collect_rankings(request.content, stage1_results)
+             aggregate_rankings = calculate_aggregate_rankings(stage2_results, label_to_model)
+             yield f"data: {json.dumps({'type': 'stage2_complete', 'data': stage2_results, 'metadata': {'label_to_model': label_to_model, 'aggregate_rankings': aggregate_rankings}})}\n\n"
+
+             # Stage 3: Synthesize final answer
+             yield f"data: {json.dumps({'type': 'stage3_start'})}\n\n"
+             stage3_result = await stage3_synthesize_final(request.content, stage1_results, stage2_results)
+             yield f"data: {json.dumps({'type': 'stage3_complete', 'data': stage3_result})}\n\n"
+
+             # Wait for title generation if it was started
+             if title_task:
+                 title = await title_task
+                 storage.update_conversation_title(conversation_id, title)
+                 yield f"data: {json.dumps({'type': 'title_complete', 'data': {'title': title}})}\n\n"
+
+             # Save complete assistant message
+             storage.add_assistant_message(
+                 conversation_id,
+                 stage1_results,
+                 stage2_results,
+                 stage3_result
+             )
+
+             # Send completion event
+             yield f"data: {json.dumps({'type': 'complete'})}\n\n"
+
+         except Exception as e:
+             # Send error event
+             yield f"data: {json.dumps({'type': 'error', 'message': str(e)})}\n\n"
+
+     return StreamingResponse(
+         event_generator(),
+         media_type="text/event-stream",
+         headers={
+             "Cache-Control": "no-cache",
+             "Connection": "keep-alive",
+         }
+     )
+
+
+ if __name__ == "__main__":
+     import uvicorn
+     uvicorn.run(app, host="0.0.0.0", port=8001)
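
A minimal client sketch for the streaming endpoint, assuming the server is running locally on port 8001 as configured above (the question text is illustrative):

    import json
    import httpx

    BASE = "http://localhost:8001"

    # Create a conversation, then stream a message into it.
    conv = httpx.post(f"{BASE}/api/conversations", json={}).json()

    with httpx.stream(
        "POST",
        f"{BASE}/api/conversations/{conv['id']}/message/stream",
        json={"content": "Why is the sky blue?"},
        timeout=None,  # council stages can take a while
    ) as response:
        for line in response.iter_lines():
            if line.startswith("data: "):
                event = json.loads(line[len("data: "):])
                print(event["type"])  # stage1_start, stage1_complete, ..., complete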
backend/openrouter.py ADDED
@@ -0,0 +1,79 @@
+ """OpenRouter API client for making LLM requests."""
+
+ import httpx
+ from typing import List, Dict, Any, Optional
+ from .config import OPENROUTER_API_KEY, OPENROUTER_API_URL
+
+
+ async def query_model(
+     model: str,
+     messages: List[Dict[str, str]],
+     timeout: float = 120.0
+ ) -> Optional[Dict[str, Any]]:
+     """
+     Query a single model via OpenRouter API.
+
+     Args:
+         model: OpenRouter model identifier (e.g., "openai/gpt-4o")
+         messages: List of message dicts with 'role' and 'content'
+         timeout: Request timeout in seconds
+
+     Returns:
+         Response dict with 'content' and optional 'reasoning_details', or None if failed
+     """
+     headers = {
+         "Authorization": f"Bearer {OPENROUTER_API_KEY}",
+         "Content-Type": "application/json",
+     }
+
+     payload = {
+         "model": model,
+         "messages": messages,
+     }
+
+     try:
+         async with httpx.AsyncClient(timeout=timeout) as client:
+             response = await client.post(
+                 OPENROUTER_API_URL,
+                 headers=headers,
+                 json=payload
+             )
+             response.raise_for_status()
+
+             data = response.json()
+             message = data['choices'][0]['message']
+
+             return {
+                 'content': message.get('content'),
+                 'reasoning_details': message.get('reasoning_details')
+             }
+
+     except Exception as e:
+         print(f"Error querying model {model}: {e}")
+         return None
+
+
+ async def query_models_parallel(
+     models: List[str],
+     messages: List[Dict[str, str]]
+ ) -> Dict[str, Optional[Dict[str, Any]]]:
+     """
+     Query multiple models in parallel.
+
+     Args:
+         models: List of OpenRouter model identifiers
+         messages: List of message dicts to send to each model
+
+     Returns:
+         Dict mapping model identifier to response dict (or None if failed)
+     """
+     import asyncio
+
+     # Create tasks for all models
+     tasks = [query_model(model, messages) for model in models]
+
+     # Wait for all to complete
+     responses = await asyncio.gather(*tasks)
+
+     # Map models to their responses
+     return {model: response for model, response in zip(models, responses)}
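
Because query_model catches its own exceptions and returns None, query_models_parallel never raises for a single failing model; callers are expected to filter the Nones, as stage1_collect_responses does. A minimal direct-usage sketch (the model list and prompt are illustrative):

    import asyncio
    from backend.openrouter import query_models_parallel

    async def main():
        messages = [{"role": "user", "content": "Name one prime number."}]
        results = await query_models_parallel(["openai/gpt-5.1", "x-ai/grok-4"], messages)
        for model, result in results.items():
            print(model, "->", "ok" if result is not None else "failed")

    asyncio.run(main())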
backend/storage.py ADDED
@@ -0,0 +1,172 @@
+ """JSON-based storage for conversations."""
+
+ import json
+ import os
+ from datetime import datetime
+ from typing import List, Dict, Any, Optional
+ from pathlib import Path
+ from .config import DATA_DIR
+
+
+ def ensure_data_dir():
+     """Ensure the data directory exists."""
+     Path(DATA_DIR).mkdir(parents=True, exist_ok=True)
+
+
+ def get_conversation_path(conversation_id: str) -> str:
+     """Get the file path for a conversation."""
+     return os.path.join(DATA_DIR, f"{conversation_id}.json")
+
+
+ def create_conversation(conversation_id: str) -> Dict[str, Any]:
+     """
+     Create a new conversation.
+
+     Args:
+         conversation_id: Unique identifier for the conversation
+
+     Returns:
+         New conversation dict
+     """
+     ensure_data_dir()
+
+     conversation = {
+         "id": conversation_id,
+         "created_at": datetime.utcnow().isoformat(),
+         "title": "New Conversation",
+         "messages": []
+     }
+
+     # Save to file
+     path = get_conversation_path(conversation_id)
+     with open(path, 'w') as f:
+         json.dump(conversation, f, indent=2)
+
+     return conversation
+
+
+ def get_conversation(conversation_id: str) -> Optional[Dict[str, Any]]:
+     """
+     Load a conversation from storage.
+
+     Args:
+         conversation_id: Unique identifier for the conversation
+
+     Returns:
+         Conversation dict or None if not found
+     """
+     path = get_conversation_path(conversation_id)
+
+     if not os.path.exists(path):
+         return None
+
+     with open(path, 'r') as f:
+         return json.load(f)
+
+
+ def save_conversation(conversation: Dict[str, Any]):
+     """
+     Save a conversation to storage.
+
+     Args:
+         conversation: Conversation dict to save
+     """
+     ensure_data_dir()
+
+     path = get_conversation_path(conversation['id'])
+     with open(path, 'w') as f:
+         json.dump(conversation, f, indent=2)
+
+
+ def list_conversations() -> List[Dict[str, Any]]:
+     """
+     List all conversations (metadata only).
+
+     Returns:
+         List of conversation metadata dicts
+     """
+     ensure_data_dir()
+
+     conversations = []
+     for filename in os.listdir(DATA_DIR):
+         if filename.endswith('.json'):
+             path = os.path.join(DATA_DIR, filename)
+             with open(path, 'r') as f:
+                 data = json.load(f)
+             # Return metadata only
+             conversations.append({
+                 "id": data["id"],
+                 "created_at": data["created_at"],
+                 "title": data.get("title", "New Conversation"),
+                 "message_count": len(data["messages"])
+             })
+
+     # Sort by creation time, newest first
+     conversations.sort(key=lambda x: x["created_at"], reverse=True)
+
+     return conversations
+
+
+ def add_user_message(conversation_id: str, content: str):
+     """
+     Add a user message to a conversation.
+
+     Args:
+         conversation_id: Conversation identifier
+         content: User message content
+     """
+     conversation = get_conversation(conversation_id)
+     if conversation is None:
+         raise ValueError(f"Conversation {conversation_id} not found")
+
+     conversation["messages"].append({
+         "role": "user",
+         "content": content
+     })
+
+     save_conversation(conversation)
+
+
+ def add_assistant_message(
+     conversation_id: str,
+     stage1: List[Dict[str, Any]],
+     stage2: List[Dict[str, Any]],
+     stage3: Dict[str, Any]
+ ):
+     """
+     Add an assistant message with all 3 stages to a conversation.
+
+     Args:
+         conversation_id: Conversation identifier
+         stage1: List of individual model responses
+         stage2: List of model rankings
+         stage3: Final synthesized response
+     """
+     conversation = get_conversation(conversation_id)
+     if conversation is None:
+         raise ValueError(f"Conversation {conversation_id} not found")
+
+     conversation["messages"].append({
+         "role": "assistant",
+         "stage1": stage1,
+         "stage2": stage2,
+         "stage3": stage3
+     })
+
+     save_conversation(conversation)
+
+
+ def update_conversation_title(conversation_id: str, title: str):
+     """
+     Update the title of a conversation.
+
+     Args:
+         conversation_id: Conversation identifier
+         title: New title for the conversation
+     """
+     conversation = get_conversation(conversation_id)
+     if conversation is None:
+         raise ValueError(f"Conversation {conversation_id} not found")
+
+     conversation["title"] = title
+     save_conversation(conversation)
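
Storage is one JSON file per conversation under DATA_DIR, rewritten in full on every mutation. A minimal round-trip sketch, assuming it runs from the repository root so the relative data/conversations path resolves:

    import uuid
    from backend import storage

    conv_id = str(uuid.uuid4())
    storage.create_conversation(conv_id)
    storage.add_user_message(conv_id, "Hello, council")
    storage.update_conversation_title(conv_id, "Greeting test")

    loaded = storage.get_conversation(conv_id)
    assert loaded["title"] == "Greeting test"
    assert loaded["messages"][0] == {"role": "user", "content": "Hello, council"}

One caveat: every helper does a full read-modify-write of the file with no locking, so concurrent requests against the same conversation could interleave and lose a message; that is acceptable for a local single-user app but worth knowing before deploying.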