Rename code_interpreter.py to logic.py
- code_interpreter.py +0 -281
- logic.py +196 -0
code_interpreter.py
DELETED
@@ -1,281 +0,0 @@
import os
import io
import sys
import uuid
import base64
import traceback
import contextlib
import tempfile
import subprocess
import sqlite3
from typing import Dict, List, Any, Optional, Union
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from PIL import Image


class CodeInterpreter:
    def __init__(self, allowed_modules=None, max_execution_time=30, working_directory=None):
        """Initialize the code interpreter with safety measures."""
        self.allowed_modules = allowed_modules or [
            "numpy", "pandas", "matplotlib", "scipy", "sklearn",
            "math", "random", "statistics", "datetime", "collections",
            "itertools", "functools", "operator", "re", "json",
            "sympy", "networkx", "nltk", "PIL", "pytesseract",
            "cmath", "uuid", "tempfile", "requests", "urllib"
        ]
        self.max_execution_time = max_execution_time
        self.working_directory = working_directory or os.path.join(os.getcwd())
        if not os.path.exists(self.working_directory):
            os.makedirs(self.working_directory)

        self.globals = {
            "__builtins__": __builtins__,
            "np": np,
            "pd": pd,
            "plt": plt,
            "Image": Image,
        }
        self.temp_sqlite_db = os.path.join(tempfile.gettempdir(), "code_exec.db")

    def execute_code(self, code: str, language: str = "python") -> Dict[str, Any]:
        """Execute the provided code in the selected programming language."""
        language = language.lower()
        execution_id = str(uuid.uuid4())

        result = {
            "execution_id": execution_id,
            "status": "error",
            "stdout": "",
            "stderr": "",
            "result": None,
            "plots": [],
            "dataframes": []
        }

        try:
            if language == "python":
                return self._execute_python(code, execution_id)
            elif language == "bash":
                return self._execute_bash(code, execution_id)
            elif language == "sql":
                return self._execute_sql(code, execution_id)
            elif language == "c":
                return self._execute_c(code, execution_id)
            elif language == "java":
                return self._execute_java(code, execution_id)
            else:
                result["stderr"] = f"Unsupported language: {language}"
        except Exception as e:
            result["stderr"] = str(e)

        return result

    def _execute_python(self, code: str, execution_id: str) -> dict:
        output_buffer = io.StringIO()
        error_buffer = io.StringIO()
        result = {
            "execution_id": execution_id,
            "status": "error",
            "stdout": "",
            "stderr": "",
            "result": None,
            "plots": [],
            "dataframes": []
        }

        try:
            exec_dir = os.path.join(self.working_directory, execution_id)
            os.makedirs(exec_dir, exist_ok=True)
            plt.switch_backend('Agg')

            with contextlib.redirect_stdout(output_buffer), contextlib.redirect_stderr(error_buffer):
                exec_result = exec(code, self.globals)

            if plt.get_fignums():
                for i, fig_num in enumerate(plt.get_fignums()):
                    fig = plt.figure(fig_num)
                    img_path = os.path.join(exec_dir, f"plot_{i}.png")
                    fig.savefig(img_path)
                    with open(img_path, "rb") as img_file:
                        img_data = base64.b64encode(img_file.read()).decode('utf-8')
                    result["plots"].append({
                        "figure_number": fig_num,
                        "data": img_data
                    })

            for var_name, var_value in self.globals.items():
                if isinstance(var_value, pd.DataFrame) and len(var_value) > 0:
                    result["dataframes"].append({
                        "name": var_name,
                        "head": var_value.head().to_dict(),
                        "shape": var_value.shape,
                        "dtypes": str(var_value.dtypes)
                    })

            result["status"] = "success"
            result["stdout"] = output_buffer.getvalue()
            result["result"] = exec_result

        except Exception as e:
            result["status"] = "error"
            result["stderr"] = f"{error_buffer.getvalue()}\n{traceback.format_exc()}"

        return result

    def _execute_bash(self, code: str, execution_id: str) -> dict:
        try:
            completed = subprocess.run(
                code, shell=True, capture_output=True, text=True, timeout=self.max_execution_time
            )
            return {
                "execution_id": execution_id,
                "status": "success" if completed.returncode == 0 else "error",
                "stdout": completed.stdout,
                "stderr": completed.stderr,
                "result": None,
                "plots": [],
                "dataframes": []
            }
        except subprocess.TimeoutExpired:
            return {
                "execution_id": execution_id,
                "status": "error",
                "stdout": "",
                "stderr": "Execution timed out.",
                "result": None,
                "plots": [],
                "dataframes": []
            }

    def _execute_sql(self, code: str, execution_id: str) -> dict:
        result = {
            "execution_id": execution_id,
            "status": "error",
            "stdout": "",
            "stderr": "",
            "result": None,
            "plots": [],
            "dataframes": []
        }
        try:
            conn = sqlite3.connect(self.temp_sqlite_db)
            cur = conn.cursor()
            cur.execute(code)
            if code.strip().lower().startswith("select"):
                columns = [description[0] for description in cur.description]
                rows = cur.fetchall()
                df = pd.DataFrame(rows, columns=columns)
                result["dataframes"].append({
                    "name": "query_result",
                    "head": df.head().to_dict(),
                    "shape": df.shape,
                    "dtypes": str(df.dtypes)
                })
            else:
                conn.commit()

            result["status"] = "success"
            result["stdout"] = "Query executed successfully."

        except Exception as e:
            result["stderr"] = str(e)
        finally:
            conn.close()

        return result

    def _execute_c(self, code: str, execution_id: str) -> dict:
        temp_dir = tempfile.mkdtemp()
        source_path = os.path.join(temp_dir, "program.c")
        binary_path = os.path.join(temp_dir, "program")

        try:
            with open(source_path, "w") as f:
                f.write(code)

            compile_proc = subprocess.run(
                ["gcc", source_path, "-o", binary_path],
                capture_output=True, text=True, timeout=self.max_execution_time
            )
            if compile_proc.returncode != 0:
                return {
                    "execution_id": execution_id,
                    "status": "error",
                    "stdout": compile_proc.stdout,
                    "stderr": compile_proc.stderr,
                    "result": None,
                    "plots": [],
                    "dataframes": []
                }

            run_proc = subprocess.run(
                [binary_path],
                capture_output=True, text=True, timeout=self.max_execution_time
            )
            return {
                "execution_id": execution_id,
                "status": "success" if run_proc.returncode == 0 else "error",
                "stdout": run_proc.stdout,
                "stderr": run_proc.stderr,
                "result": None,
                "plots": [],
                "dataframes": []
            }
        except Exception as e:
            return {
                "execution_id": execution_id,
                "status": "error",
                "stdout": "",
                "stderr": str(e),
                "result": None,
                "plots": [],
                "dataframes": []
            }

    def _execute_java(self, code: str, execution_id: str) -> dict:
        temp_dir = tempfile.mkdtemp()
        source_path = os.path.join(temp_dir, "Main.java")

        try:
            with open(source_path, "w") as f:
                f.write(code)

            compile_proc = subprocess.run(
                ["javac", source_path],
                capture_output=True, text=True, timeout=self.max_execution_time
            )
            if compile_proc.returncode != 0:
                return {
                    "execution_id": execution_id,
                    "status": "error",
                    "stdout": compile_proc.stdout,
                    "stderr": compile_proc.stderr,
                    "result": None,
                    "plots": [],
                    "dataframes": []
                }

            run_proc = subprocess.run(
                ["java", "-cp", temp_dir, "Main"],
                capture_output=True, text=True, timeout=self.max_execution_time
            )
            return {
                "execution_id": execution_id,
                "status": "success" if run_proc.returncode == 0 else "error",
                "stdout": run_proc.stdout,
                "stderr": run_proc.stderr,
                "result": None,
                "plots": [],
                "dataframes": []
            }
        except Exception as e:
            return {
                "execution_id": execution_id,
                "status": "error",
                "stdout": "",
                "stderr": str(e),
                "result": None,
                "plots": [],
                "dataframes": []
            }
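
For context, a minimal usage sketch of the class removed by this commit; the sample code string and timeout value are illustrative assumptions, not part of the original file.

# Hypothetical driver for the removed CodeInterpreter class (illustrative only).
from code_interpreter import CodeInterpreter

interpreter = CodeInterpreter(max_execution_time=10)  # assumed timeout for the sketch

# execute_code returns a dict with execution_id, status, stdout, stderr, result, plots, and dataframes.
outcome = interpreter.execute_code("print(2 + 2)", language="python")
print(outcome["status"])   # "success" or "error"
print(outcome["stdout"])   # captured standard output, e.g. "4"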
logic.py
ADDED
@@ -0,0 +1,196 @@
from typing import Dict, List, Tuple
import re
import tempfile
from pathlib import Path
import pandas as pd
import requests
from agent import GaiaAgent
from pandas import DataFrame

# --- Constants ---
DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
QUESTIONS_URL = f"{DEFAULT_API_URL}/questions"
SUBMIT_URL = f"{DEFAULT_API_URL}/submit"
FILE_PATH = f"{DEFAULT_API_URL}/files/"


# --- Helper Methods ---
def fetch_all_questions() -> Dict:
    """Fetches all questions from the specified API endpoint.

    This function retrieves a list of questions from the API, handles potential errors
    such as network issues, invalid responses, or empty question lists, and returns
    the questions as a dictionary.

    Returns:
        Dict: A dictionary containing the questions data retrieved from the API.

    Raises:
        UserWarning: If there is an error fetching the questions, such as network issues,
            invalid JSON response, or an empty question list. The exception message
            provides details about the specific error encountered.
    """
    print(f"Fetching questions from: {QUESTIONS_URL}")
    try:
        # Request inside the try block so network errors are caught below.
        response = requests.get(QUESTIONS_URL, timeout=15)
        response.raise_for_status()
        questions_data = response.json()
        if not questions_data:
            print("Fetched questions list is empty.")
            raise UserWarning("Fetched questions list is empty or invalid format.")
        print(f"Fetched {len(questions_data)} questions.")
        return questions_data
    except requests.exceptions.RequestException as e:
        print(f"Error fetching questions: {e}")
        raise UserWarning(f"Error fetching questions: {e}")
    except requests.exceptions.JSONDecodeError as e:
        print(f"Error decoding JSON response from questions endpoint: {e}")
        print(f"Response text: {response.text[:500]}")
        raise UserWarning(f"Error decoding server response for questions: {e}")
    except Exception as e:
        print(f"An unexpected error occurred fetching questions: {e}")
        raise UserWarning(f"An unexpected error occurred fetching questions: {e}")


def submit_answers(submission_data: dict, results_log: list) -> Tuple[str, DataFrame]:
    """Submits answers to the scoring API and returns the submission status and results.

    This function sends the provided answers to the scoring API, handles potential errors
    such as network issues, server errors, or invalid responses, and returns a status
    message indicating the success or failure of the submission, along with a DataFrame
    containing the results log.

    Args:
        submission_data (dict): A dictionary containing the answers to be submitted.
            Expected to have a structure compatible with the scoring API.
        results_log (list): A list of dictionaries containing the results log.
            This log is converted to a Pandas DataFrame and returned.

    Returns:
        Tuple[str, DataFrame]: A tuple containing:
            - A status message (str) indicating the submission status and any relevant
              information or error messages.
            - A Pandas DataFrame containing the results log.
    """
    try:
        response = requests.post(SUBMIT_URL, json=submission_data, timeout=60)
        response.raise_for_status()
        result_data = response.json()
        final_status = (
            f"Submission Successful!\n"
            f"User: {result_data.get('username')}\n"
            f"Overall Score: {result_data.get('score', 'N/A')}% "
            f"({result_data.get('correct_count', '?')}/"
            f"{result_data.get('total_attempted', '?')} correct)\n"
            f"Message: {result_data.get('message', 'No message received.')}"
        )
        print("Submission successful.")
        results_df = pd.DataFrame(results_log)
        return final_status, results_df
    except requests.exceptions.HTTPError as e:
        error_detail = f"Server responded with status {e.response.status_code}."
        try:
            error_json = e.response.json()
            error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
        except requests.exceptions.JSONDecodeError:
            error_detail += f" Response: {e.response.text[:500]}"
        status_message = f"Submission Failed: {error_detail}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except requests.exceptions.Timeout:
        status_message = "Submission Failed: The request timed out."
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except requests.exceptions.RequestException as e:
        status_message = f"Submission Failed: Network error - {e}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except Exception as e:
        status_message = f"An unexpected error occurred during submission: {e}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df


def run_agent(
    gaia_agent: GaiaAgent, questions_data: List[Dict]
) -> Tuple[List[Dict], List[Dict]]:
    """Runs the agent on a list of questions and returns the results and answers.

    This function iterates through a list of questions, runs the provided agent on each
    question, and collects the results and answers. It handles potential errors during
    agent execution and returns the results log and the answers payload.

    Args:
        gaia_agent (GaiaAgent): An instance of the GaiaAgent class, which is responsible
            for generating answers to the questions.
        questions_data (List[Dict]): A list of dictionaries, where each dictionary
            represents a question and contains at least the 'task_id' and 'question' keys.

    Returns:
        Tuple[List[Dict], List[Dict]]: A tuple containing:
            - A list of dictionaries representing the results log, where each dictionary
              contains the 'Task ID', 'Question', and 'Submitted Answer'.
            - A list of dictionaries representing the answers payload, where each dictionary
              contains the 'task_id' and 'submitted_answer'.
    """
    results_log = []
    answers_payload = []

    print(f"Running agent on {len(questions_data)} questions...")
    for item in questions_data:
        task_id = item.get("task_id")
        question_text = item.get("question")
        question_text = process_file(task_id, question_text)
        if not task_id or question_text is None:
            print(f"Skipping invalid item (missing task_id or question): {item}")
            continue
        try:
            submitted_answer = gaia_agent(task_id, question_text)
            answers_payload.append(
                {"task_id": task_id, "submitted_answer": submitted_answer}
            )
        except Exception as e:
            print(f"Error running agent on task {task_id}: {e}")
            submitted_answer = f"AGENT ERROR: {e}"

        results_log.append(
            {
                "Task ID": task_id,
                "Question": question_text,
                "Submitted Answer": submitted_answer,
            }
        )
    return results_log, answers_payload


def process_file(task_id: str, question_text: str) -> str:
    """
    Attempt to download a file associated with a task from the API.
    - If the file exists (HTTP 200), it is saved to a temp directory and the question
      text is returned with the local file path appended.
    - If the file cannot be retrieved (404 or any other request error), the original
      question text is returned unchanged.
    """
    file_url = f"{FILE_PATH}{task_id}"

    try:
        response = requests.get(file_url, timeout=30)
        response.raise_for_status()
    except requests.exceptions.RequestException as exc:
        print(f"Exception in download_file>> {str(exc)}")
        return question_text  # Unable to get the file

    # Determine filename from 'Content-Disposition' header, fallback to task_id
    content_disposition = response.headers.get("content-disposition", "")
    filename = task_id
    match = re.search(r'filename="([^"]+)"', content_disposition)
    if match:
        filename = match.group(1)

    # Save file in a temp directory
    temp_storage_dir = Path(tempfile.gettempdir()) / "gaia_cached_files"
    temp_storage_dir.mkdir(parents=True, exist_ok=True)

    file_path = temp_storage_dir / filename
    file_path.write_bytes(response.content)
    return (
        f"{question_text}\n\n"
        f"---\n"
        f"A file was downloaded for this task and saved locally at:\n"
        f"{str(file_path)}\n"
        f"---\n\n"
    )
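
A minimal sketch of how these helpers might be wired together in the Space's entry point; the GaiaAgent constructor call and the username/agent_code fields of the submission payload are assumptions based on the course scoring API, not defined in this file.

# Hypothetical wiring of the logic.py helpers (illustrative only).
from agent import GaiaAgent
from logic import fetch_all_questions, run_agent, submit_answers

questions = fetch_all_questions()                  # raises UserWarning on fetch problems
agent = GaiaAgent()                                # assumption: default construction
results_log, answers_payload = run_agent(agent, questions)

submission_data = {                                # assumed payload shape expected by the scoring API
    "username": "your-hf-username",
    "agent_code": "https://huggingface.co/spaces/your-username/your-space/tree/main",
    "answers": answers_payload,
}
status_message, results_df = submit_answers(submission_data, results_log)
print(status_message)
print(results_df.head())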