First_agent_template

Sleeping

File size: 7,618 Bytes

import os
from agent.utils import download_gaia_attachment_local
print(f"Current Working Directory: {os.getcwd()}")
from pathlib import Path
import shutil # For cleaning up directories

# --- IMPORTANT: Load .env file at the absolute beginning ---
# These imports and calls must happen before any other project-specific imports
# that might rely on environment variables (like agent.agent importing agent.nodes, etc.)
try:
    from dotenv import load_dotenv
    # Define PROJECT_ROOT very early so load_dotenv can use it
    PROJECT_ROOT = Path(__file__).resolve().parents[1]
    load_dotenv(dotenv_path=PROJECT_ROOT / ".env")
    if not os.getenv("OPENAI_API_KEY"):
        print("\nWARNING: OPENAI_API_KEY environment variable not set or empty after .env load.")
        print("Please ensure your .env file is in the project root and contains OPENAI_API_KEY=\"your_key_here\".")
        # You might want to raise an error here to stop execution if the key is critical
        # raise ValueError("OPENAI_API_KEY is not set. Cannot proceed without it.")
    else:
        print("OPENAI_API_KEY loaded successfully from .env file (via test_agent.py).")
except ImportError:
    print("Python 'dotenv' package not found. Install with: pip install python-dotenv")
    print("Please set OPENAI_API_KEY manually in your terminal (e.g., export OPENAI_API_KEY=\"your_key\").")
# --- End .env loading block ---


# Now, import other standard libraries
import json
import requests

# Import necessary components from your agent package
# These imports will now execute *after* the dotenv loading is complete
from agent.agent import app # This imports your compiled LangGraph workflow
from agent.nodes import AgentState # The TypedDict for your agent's state
from agent.config import DEFAULT_API_URL, USER_AGENT, ATTACHMENTS, ATTACHMENT_BASE_URL
from agent.utils import get_file_type, download_file


# --- Test Harness Configuration --
# PROJECT_ROOT is defined above in the dotenv block
TEST_DATA_DIR = PROJECT_ROOT / "data"
QUESTIONS_FILE = TEST_DATA_DIR / "questions.json"
ATTACHMENTS_DIR = TEST_DATA_DIR / "attachments"


def setup_test_environment():
    """Ensures necessary directories exist and cleans up old attachments."""
    print("Setting up test environment...")
    TEST_DATA_DIR.mkdir(exist_ok=True)
    ATTACHMENTS_DIR.mkdir(exist_ok=True)

    # Clear existing attachments to ensure a fresh run
    for item in ATTACHMENTS_DIR.iterdir():
        if item.is_file():
            item.unlink() # Delete files
        elif item.is_dir():
            shutil.rmtree(item) # Delete directories recursively
    print(f"Cleaned attachments directory: {ATTACHMENTS_DIR}")

    # Also clear the in-memory ATTACHMENTS global for a fresh test run
    ATTACHMENTS.clear()


def download_gaia_questions():
    """Downloads GAIA questions from the scoring server and saves them locally."""
    print(f"Downloading GAIA questions from {DEFAULT_API_URL}/questions ...")
    try:
        response = requests.get(
            f"{DEFAULT_API_URL}/questions",
            headers={"User-Agent": USER_AGENT},
            timeout=20 # Increased timeout for robustness
        )
        response.raise_for_status()
        questions = response.json()
        with open(QUESTIONS_FILE, "w", encoding="utf-8") as f:
            json.dump(questions, f, indent=4)
        print(f"Downloaded {len(questions)} questions to {QUESTIONS_FILE}")
        return questions
    except requests.exceptions.RequestException as e:
        print(f"Error downloading questions: {e}")
        return []


# Smart attachment handling in your test_agent.py

def run_local_agent_test():
    """Runs the agent with smart attachment handling"""
    setup_test_environment()

    # Load questions
    questions = []
    if QUESTIONS_FILE.exists():
        with open(QUESTIONS_FILE, "r", encoding="utf-8") as f:
            questions = json.load(f)
        print(f"Loaded {len(questions)} questions from {QUESTIONS_FILE}")
    if not questions:
        questions = download_gaia_questions()

    if not questions:
        print("No questions to process. Exiting local test.")
        return

    print("\n" + "="*50)
    print("Starting Local Agent Test Run")
    print("="*50 + "\n")

    results = []
    for i, q in enumerate(questions):
        print(f"\n--- Processing Question {i+1}/{len(questions)} (Task ID: {q['task_id']}) ---")
        
        # Reset ATTACHMENTS for each question
        ATTACHMENTS.clear() 

        # SMART: Only download if file_name is not empty
        attachment_id_for_state = None
        if q.get("file_name", "").strip():
            print(f"  File available: {q['file_name']}")
            print(f"  Attempting download from: {ATTACHMENT_BASE_URL}{q['task_id']}")
            attachment_id_for_state = download_gaia_attachment_local(q["task_id"])
            #debug code here
            # Right after your attachment download attempt:
            print(f"DEBUG CHECKPOINT:")
            print(f"  Question has file_name: '{q.get('file_name', '')}'")
            print(f"  Download attempt returned: {attachment_id_for_state}")
            print(f"  ATTACHMENTS now contains: {list(ATTACHMENTS.keys())}")
            print(f"  Passing attachment_id to agent: {attachment_id_for_state}")
            #end debug code
            if attachment_id_for_state:
                print(f"  ✅ Downloaded: {ATTACHMENTS[attachment_id_for_state]['name']}")
            else:
                print(f"  ❌ Download failed")
        else:
            print(f"  No attachment for this question")
        
        initial_state = AgentState(
            question=q["question"],
            answer="",
            extracted_data="",
            media_type="",
            attachment_id=attachment_id_for_state,
            task_id=q["task_id"],
        )

        try:
            # Invoke the LangGraph agent
            final_state = app.invoke(initial_state)

            predicted_answer = final_state["answer"]
            results.append({
                "task_id": q["task_id"],
                "question": q["question"],
                "predicted_answer": predicted_answer,
                "has_file": bool(q.get("file_name", "").strip()),
            })
            print(f"\n  Question: {q['question'][:100]}...")
            print(f"  Agent's Answer: {predicted_answer}")

        except Exception as e:
            error_msg = f"ERROR: Agent failed to process question {q['task_id']}: {e}"
            print(f"\n  {error_msg}")
            results.append({
                "task_id": q["task_id"],
                "question": q["question"],
                "predicted_answer": error_msg,
                "has_file": bool(q.get("file_name", "").strip()),
            })

    print("\n" + "="*50)
    print("Local Agent Test Run Summary")
    print("="*50 + "\n")
    
    # Categorize results
    with_files = [r for r in results if r["has_file"]]
    without_files = [r for r in results if not r["has_file"]]
    
    print(f"Questions with files: {len(with_files)}")
    print(f"Questions without files: {len(without_files)}")
    print()
    
    for res in results:
        file_indicator = "📎" if res["has_file"] else "💬"
        print(f"{file_indicator} Task ID: {res['task_id']}")
        print(f"  Question: {res['question'][:80]}...")
        print(f"  Answer: {res['predicted_answer']}\n")

    print("\n--- Local Test Complete ---")


if __name__ == "__main__":
    # The load_dotenv call is now at the very top of the file
    # So this block simply calls the main test function.
    run_local_agent_test()