File size: 6,591 Bytes
657c936
 
dfdbee3
657c936
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dfdbee3
 
 
 
 
657c936
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c8134bb
657c936
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dfdbee3
657c936
dfdbee3
 
 
657c936
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dfdbee3
657c936
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
import os
import traceback
import uuid

from google.adk.agents import Agent, LlmAgent, SequentialAgent
from google.adk.models.google_llm import Gemini
from google.adk.runners import Runner
from google.adk.sessions import InMemorySessionService
from google.adk.memory import InMemoryMemoryService
from google.adk.tools import google_search, load_memory
from google.genai import types

# ---------- 1. API KEY SETUP (Hugging Face Secret) ----------

# Read the Gemini API key from the environment (injected as an HF Space secret).
GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")

if not GOOGLE_API_KEY:
    # On HF, set this in: Settings -> Variables and secrets -> New secret: GOOGLE_API_KEY
    # Fail fast at import time so a misconfigured Space does not limp along
    # and surface confusing auth errors deep inside the agent pipeline.
    raise RuntimeError(
        "GOOGLE_API_KEY is not set. Please add it as a secret in your Hugging Face Space."
    )

# Re-export into the process environment so the google.genai / ADK client
# libraries (which read os.environ themselves) can pick it up.
os.environ["GOOGLE_API_KEY"] = GOOGLE_API_KEY

# ---------- 2. ADK CONFIG ----------

# Retry policy shared by every Gemini model call in the pipeline:
# up to 5 attempts with exponential backoff (base 7, starting at 1s),
# retrying only on rate-limit (429) and transient server errors (500/503/504).
retry_config = types.HttpRetryOptions(
    attempts=5,
    exp_base=7,
    initial_delay=1,
    http_status_codes=[429, 500, 503, 504],
)

# ADK identifiers: a single app name and a fixed demo user id.
# NOTE(review): all callers share USER_ID, so memory is global to the demo,
# not per-visitor — confirm that is intended for a public Space.
APP_NAME = "FakeNewsApp"
USER_ID = "demo_user"

# In-memory (non-persistent) session and memory stores — state is lost on
# process restart, which is acceptable for a demo Space.
session_service = InMemorySessionService()
memory_service = InMemoryMemoryService()

# ----------3. generate session_id ------------
def generate_session_id() -> str:
    """Return a fresh random session id (canonical UUID4 string, 36 chars)."""
    return str(uuid.uuid4())

# ---------- 4. AGENTS ----------

# Pipeline stage 1: distill the forwarded message into one clean factual
# claim plus search keywords. Output is stored in session state under
# "extracted_claim" (referenced as {extracted_claim} by the next agent).
claim_extractor_agent = Agent(
    name="ClaimExtractorAgent",
    model=Gemini(
        model="gemini-2.5-flash-lite",
        retry_options=retry_config,
    ),
    instruction="""
    You will receive a WhatsApp forward or viral message.

    TASK:
    1. Identify ONE main factual claim in clean, simple form.
    2. Rewrite it in one sentence.
    3. Extract 3–5 search keywords.

    OUTPUT FORMAT:
    Claim: <cleaned claim>
    Keywords: <comma separated keywords>
    """,
    output_key="extracted_claim",
)

# Pipeline stage 2: run web searches for the extracted claim via the
# google_search tool and collect candidate sources. Output is stored in
# session state under "search_results" for the verdict stage.
evidence_search_agent = Agent(
    name="EvidenceSearchAgent",
    model=Gemini(
        model="gemini-2.5-flash-lite",
        retry_options=retry_config,
    ),
    tools=[google_search],
    instruction="""
    You will receive extracted claim info:

    {extracted_claim}

    TASK:
    1. Use google_search with 2–3 queries:
       - "<claim> fact check"
       - "<keywords> news"
       - "<keywords> official site"
    2. Return 5–7 useful results with:
       - title
       - url
       - snippet
       - source type (gov, fact-check, news, blog)

    OUTPUT FORMAT:
    <list of sources in bullet points>
    """,
    output_key="search_results",
)

# Pipeline stage 3: weigh the collected sources and produce the final
# verdict report (evidence table + verdict + plain-language explanation).
# Uses the stronger non-lite model since this is the reasoning-heavy step.
# Output is stored in session state under "final_report".
verdict_agent = Agent(
    name="VerdictAgent",
    model=Gemini(
        model="gemini-2.5-flash", # earlier using gemini-2.5-flash-lite
        retry_options=retry_config,
    ),
    instruction="""
    You will receive search results:

    {search_results}

    TASK:
    1. For each source, decide SUPPORT / REFUTE / IRRELEVANT.
    2. Produce a Markdown table:
       | Source | Type | Stance | Summary |
    3. Decide the final verdict:
       - Mostly refute β†’ Likely FALSE
       - Mostly support β†’ Likely TRUE
       - Mixed β†’ Partly true/misleading
       - No credible sources β†’ Unverified – Do not share
    4. Write a SIMPLE explanation for elderly users.

    OUTPUT FORMAT:
    Evidence Table:
    <table>

    Verdict:
    <verdict>

    Explanation:
    <simple explanation>
    """,
    output_key="final_report",
)

# Pipeline stage 4: fetch the user's fact-check history via the load_memory
# tool and summarize the last two claims. Output is stored in session state
# under "recent_claims". The instruction is deliberately forceful because
# small models tend to chat instead of calling the tool.
memory_agent = LlmAgent(
    name="MemoryAgent",
    model=Gemini(
        model="gemini-2.5-flash-lite",
        retry_options=retry_config,
    ),
    tools=[load_memory],
    instruction="""
    You are a background history fetcher. You are NOT a chatbot. 
    
    YOUR STRICT COMMANDS:
    1. IGNORE any input text you receive from previous agents.
    2. IMMEDIATELY call the function `load_memory` to get the user's past sessions.
    3. Once you receive the memory data, extract and list the distinct claims found.
    4. Return ONLY a bulleted list of the last 2 claims.
    
    IF NO MEMORY DATA IS RETURNED:
    - Output: "No previous checks found."
    
    DO NOT ask "Would you like me to?". DO NOT explain what you are doing. JUST RUN THE TOOL.
    """,
    output_key="recent_claims",
)

# Wire the four stages into a fixed sequential pipeline:
# extract claim -> search evidence -> produce verdict -> recall history.
# Each stage reads the previous stage's output from shared session state.
root_agent = SequentialAgent(
    name="FakeNewsPipeline",
    sub_agents=[
        claim_extractor_agent,
        evidence_search_agent,
        verdict_agent,
        memory_agent,
    ],
)

# Single module-level Runner bound to the in-memory session/memory services;
# run_eldersafe() drives it for every Gradio request.
runner = Runner(
    agent=root_agent,
    app_name=APP_NAME,
    session_service=session_service,
    memory_service=memory_service,
)

# ---------- 5. PUBLIC FUNCTION USED BY GRADIO ----------

async def run_eldersafe(query: str, session_id: str | None = None) -> dict:
    """
    Run the full ElderSafe fact-checking pipeline for one message.

    This is the function Gradio calls.

    Args:
        query: The raw forwarded/viral message to fact-check.
        session_id: Existing ADK session id to continue; when omitted, a
            fresh UUID-based id is generated so the call gets its own session.

    Returns:
        dict with keys:
            "clean_claim": str — the extracted claim (raw query on failure),
            "final_report": str — markdown evidence table, verdict, and
                explanation (or a traceback on failure),
            "memory_context": str — bulleted list of recent claims.

    Never raises: any failure is captured and reported in "final_report".
    """
    # NOTE: the original version placed this docstring AFTER the statements
    # below, which made it a no-op string expression instead of a docstring.
    if session_id is None:
        session_id = generate_session_id()

    try:
        # Ensure the session exists. create_session raises if the id is
        # already registered; that is fine — swallow it and reuse the session.
        try:
            await session_service.create_session(
                app_name=APP_NAME,
                user_id=USER_ID,
                session_id=session_id,
            )
        except Exception:
            pass  # deliberate best-effort: session already exists

        # Prepare ADK content input
        user_msg = types.Content(
            role="user",
            parts=[types.Part(text=query)],
        )

        # Drive the pipeline to completion; intermediate events are ignored
        # because each agent writes its result into session state.
        async for _ in runner.run_async(
            user_id=USER_ID,
            session_id=session_id,
            new_message=user_msg,
        ):
            pass

        # Re-fetch the session to read the state the agents populated,
        # then persist it so the MemoryAgent can see it on future calls.
        session = await session_service.get_session(
            app_name=APP_NAME,
            user_id=USER_ID,
            session_id=session_id,
        )

        await memory_service.add_session_to_memory(session)

        # Extract outputs. The extractor's format is
        # "Claim: <text>\nKeywords: <...>"; strip down to just the claim text.
        claim = session.state.get("extracted_claim", "No claim extracted.")
        if isinstance(claim, str) and "Claim:" in claim:
            clean_claim = claim.split("Keywords:")[0].replace("Claim:", "").strip()
        else:
            clean_claim = str(claim)

        final_report = session.state.get("final_report", "Analysis failed.")
        memory_context = session.state.get("recent_claims", "")

        return {
            "clean_claim": clean_claim,
            "final_report": final_report,
            "memory_context": memory_context,
        }

    except Exception:
        # Top-level boundary: never propagate to Gradio; surface the
        # traceback in the report so the user/developer can see what broke.
        return {
            "clean_claim": query,
            "final_report": "❌ An error occurred:\n\n" + traceback.format_exc(),
            "memory_context": "",
        }