Hugescoot commited on
Commit
35b2eed
·
1 Parent(s): 7da9d5f

Enhanced LLM-first architecture with smart attachment handling

Browse files

- Replaced complex if/else routing with LLM-driven SmartRouter
- Added LLM-first nodes for web search, data analysis, calculator
- Enhanced web search to fetch full page content instead of snippets
- Fixed attachment handling to only download when file_name exists
- Upgraded to GPT-4o for better reasoning
- Added comprehensive debug logging for attachment flow

Files changed (10) hide show
  1. .env 2 +1 -0
  2. .gitattributes 2 +35 -0
  3. .gitignore 2 +16 -0
  4. README 2.md +16 -0
  5. agent/agent.py +29 -22
  6. agent/nodes.py +617 -250
  7. check_env 2.py +18 -0
  8. requirements 2.txt +21 -0
  9. requirements_backup.txt +25 -0
  10. tests/test_agent.py +36 -21
.env 2 ADDED
@@ -0,0 +1 @@
 
 
1
+ OPENAI_API_KEY="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"
.gitattributes 2 ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
.gitignore 2 ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Virtual Environment
2
+ venv/
3
+ .venv/
4
+ env/
5
+ .env/
6
+
7
+ # Other common build artifacts and cache directories
8
+ __pycache__/
9
+ *.pyc
10
+ .pytest_cache/
11
+ .mypy_cache/
12
+ .vscode/ # Important: VS Code project settings - consider if you want to share specific workspace settings
13
+ .DS_Store # macOS specific
14
+
15
+ # Environment variables file
16
+ .env
README 2.md ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: My Cool App
3
+ emoji: 🌟
4
+ colorFrom: green
5
+ colorTo: yellow
6
+ sdk: gradio
7
+ sdk_version: "4.44.1" # Always put version strings in quotes
8
+ app_file: agent/app.py # Corrected path and file extension
9
+ pinned: false
10
+ hf_oauth: true # This line is correct for enabling OAuth
11
+ ---
12
+
13
+ # My Cool App (Your App Title)
14
+
15
+ This is a description of your application.
16
+ You can add more details about what your agent does, how to use it, etc.
agent/agent.py CHANGED
@@ -1,45 +1,52 @@
 
1
  from langgraph.graph import StateGraph, END
2
- from typing import TypedDict # For AgentState
3
 
4
- # Import your state and nodes from the nodes.py file
5
  from agent.nodes import (
6
- AgentState, # The TypedDict for your agent's state
7
- MediaRouter,
8
- TextExtractionNode,
 
 
 
9
  ImageExtractionNode,
10
  AudioExtractionNode,
11
- DataExtractionNode,
12
  VideoExtractionNode,
 
13
  AnswerRefinementNode,
14
- WebSearchNode,
15
  )
16
 
17
- # Workflow Assembly (paste the code here)
18
- # Define the LangGraph workflow
19
- # Workflow Assembly
20
  workflow = StateGraph(AgentState)
21
- nodes = [
22
- "TextExtractionNode",
 
 
 
 
23
  "ImageExtractionNode",
24
  "AudioExtractionNode",
25
- "DataExtractionNode",
26
- "VideoExtractionNode",
27
- "WebSearchNode",
28
  ]
29
 
30
- workflow.add_node("MediaRouter", MediaRouter)
31
- for node in nodes:
 
 
 
32
  workflow.add_node(node, globals()[node])
33
 
34
- # Add the refinement node
35
  workflow.add_node("AnswerRefinementNode", AnswerRefinementNode)
36
 
37
- workflow.set_conditional_entry_point(MediaRouter, {node: node for node in nodes})
 
38
 
39
- for node in nodes:
 
40
  workflow.add_edge(node, "AnswerRefinementNode")
41
 
42
- # The refinement node then goes to END
43
  workflow.add_edge("AnswerRefinementNode", END)
44
 
45
- app = workflow.compile()
 
1
+ # Clean, simple agent.py - let the LLM choose
2
  from langgraph.graph import StateGraph, END
3
+ from typing import TypedDict
4
 
 
5
  from agent.nodes import (
6
+ AgentState,
7
+ SmartRouter, # Our new simple LLM-driven router
8
+ # Keep your existing working nodes
9
+ CalculatorNode,
10
+ WebSearchNode,
11
+ DataExtractionNode,
12
  ImageExtractionNode,
13
  AudioExtractionNode,
 
14
  VideoExtractionNode,
15
+ MultiStepNode,
16
  AnswerRefinementNode,
 
17
  )
18
 
19
+ # Simple workflow - let the LLM decide everything
 
 
20
  workflow = StateGraph(AgentState)
21
+
22
+ # Available execution nodes
23
+ execution_nodes = [
24
+ "CalculatorNode",
25
+ "WebSearchNode",
26
+ "DataExtractionNode",
27
  "ImageExtractionNode",
28
  "AudioExtractionNode",
29
+ "VideoExtractionNode",
30
+ "MultiStepNode",
 
31
  ]
32
 
33
+ # Add the smart router
34
+ workflow.add_node("SmartRouter", SmartRouter)
35
+
36
+ # Add all execution nodes
37
+ for node in execution_nodes:
38
  workflow.add_node(node, globals()[node])
39
 
40
+ # Add refinement
41
  workflow.add_node("AnswerRefinementNode", AnswerRefinementNode)
42
 
43
+ # Simple flow: Router -> Execution -> Refinement -> Done
44
+ workflow.set_conditional_entry_point(SmartRouter, {node: node for node in execution_nodes})
45
 
46
+ # All execution nodes go to refinement
47
+ for node in execution_nodes:
48
  workflow.add_edge(node, "AnswerRefinementNode")
49
 
 
50
  workflow.add_edge("AnswerRefinementNode", END)
51
 
52
+ app = workflow.compile()
agent/nodes.py CHANGED
@@ -1,24 +1,23 @@
1
- import os, re, base64, tempfile
 
 
2
  import pandas as pd
3
  import numpy as np
4
- from typing import TypedDict
5
- from openai import OpenAI # The OpenAI client will be initialized here or passed in
6
  from io import BytesIO, StringIO
7
- import wikipedia # Although used by utils.py, it's also conceptually related to text node logic
8
  import chardet
9
  import whisper
10
 
11
- # Import utilities and configuration needed by the nodes
12
  from agent.utils import download_file, get_youtube_transcript, extract_final_answer, get_file_type
13
- from agent.config import SYSTEM_PROMPT, ATTACHMENTS # ATTACHMENTS is important as it's read by MediaRouter and nodes
14
  from duckduckgo_search import DDGS
15
 
16
- # Initialize OpenAI client (ensure OPENAI_API_KEY is set in your environment)
17
- # This ensures each node has access to the client.
18
- # It's good practice to get the API key from an environment variable.
19
  client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
20
 
21
- # State Definition
22
  class AgentState(TypedDict):
23
  question: str
24
  answer: str
@@ -26,192 +25,606 @@ class AgentState(TypedDict):
26
  media_type: str
27
  attachment_id: str
28
  task_id: str
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
 
30
- #web search node
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
31
  def WebSearchNode(state: AgentState) -> AgentState:
 
32
  try:
33
  question = state["question"]
34
- search_query = question # Or refine the query
35
- search_results = ""
 
 
 
 
 
 
 
 
36
 
37
- with DDGS() as ddgs:
38
- for r in ddgs.text(search_query, region='wt-wt', safesearch='off', timelimit='year'):
39
- search_results += f"Title: {r['title']}\nSnippet: {r['body']}\nURL: {r['href']}\n\n"
40
- if len(search_results) > 1500: # Limit context size
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  break
 
 
42
 
43
- if not search_results:
44
  state["answer"] = "Could not find relevant search results."
45
  return state
46
 
47
- prompt = f"Question: {question}\n\nSearch Results:\n{search_results}\n\nBased on the search results, {SYSTEM_PROMPT.strip()}" # Re-use system prompt for final answer format
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
 
49
  response = client.chat.completions.create(
50
  model="gpt-4-turbo",
51
  messages=[
52
- {"role": "system", "content": SYSTEM_PROMPT},
53
- {"role": "user", "content": prompt},
54
  ],
55
- max_tokens=300,
56
  temperature=0.1,
57
  )
 
58
  raw_answer = response.choices[0].message.content
59
  state["answer"] = extract_final_answer(raw_answer)
60
- state["extracted_data"] = search_results # Store for refinement node
 
61
  except Exception as e:
62
  state["answer"] = f"Web search error: {str(e)}"
 
63
  return state
64
 
65
- # Routing Node
66
- def MediaRouter(state: AgentState) -> str:
67
- question = state["question"].lower()
68
-
69
- # 1. Check for explicit URLs in the question
70
- if re.search(r"https?://\S+", question):
71
- if re.search(r"\.(jpg|jpeg|png|gif)", question):
72
- return "ImageExtractionNode"
73
- if re.search(r"\.(mp4|mov|avi|youtube)", question):
74
- return "VideoExtractionNode"
75
- if re.search(r"\.(mp3|wav|m4a)", question):
76
- return "AudioExtractionNode"
77
- if re.search(r"\.(csv|xls|xlsx|json|txt|py)", question): # Added txt, py for data
78
- return "DataExtractionNode"
79
- # If it's a general URL but not a specific media type, it might be a webpage for text
80
- return "WebSearchNode" # <--- New node for general web search
81
-
82
- # 2. Check for attachments
83
- attachment_id = state.get("attachment_id")
84
- if attachment_id and attachment_id in ATTACHMENTS:
85
- attachment_type = ATTACHMENTS[attachment_id]["type"]
86
- type_map = {
87
- "audio": "AudioExtractionNode",
88
- "data": "DataExtractionNode",
89
- "image": "ImageExtractionNode",
90
- "video": "VideoExtractionNode",
91
- }
92
- return type_map.get(attachment_type, "TextExtractionNode") # Fallback for unknown attachment types
93
 
94
- # 3. Check for keywords (if no URL or attachment)
95
- if re.search(r"(jpg|jpeg|png|gif|image)", question):
96
- return "ImageExtractionNode"
97
- if re.search(r"(mp4|mov|avi|video|youtube)", question):
98
- return "VideoExtractionNode"
99
- if re.search(r"(mp3|wav|audio|sound)", question):
100
- return "AudioExtractionNode"
101
- if re.search(r"(csv|xls|xlsx|excel|json|data|file|document)", question): # Added more keywords
102
- return "DataExtractionNode"
 
 
103
 
104
- # Default to TextExtractionNode, which can now incorporate web search via wikipedia
105
- # Or even better, default to a dedicated WebSearchNode if text extraction alone isn't enough
106
- return "TextExtractionNode" # Or "WebSearchNode" if you implement it for all text questions
107
 
108
- #Answer Refinement Node
109
- # In nodes.py
 
 
 
110
 
111
- def AnswerRefinementNode(state: AgentState) -> AgentState:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
112
  try:
113
  question = state["question"]
114
- initial_answer = state["answer"]
115
- extracted_data = state.get("extracted_data", "") # Data extracted by previous node
116
 
117
- # Construct a prompt for the refinement LLM
118
- refinement_prompt = f"""
119
- Original Question: {question}
120
- Initial Answer: {initial_answer}
121
- Extracted Context/Data: {extracted_data if extracted_data else "No specific data was extracted, the answer was generated based on general knowledge or initial processing."}
122
 
123
- Your task is to critically review the Initial Answer in the context of the Original Question and Extracted Context/Data.
124
- Refine the Initial Answer to ensure it is accurate, directly answers the question, and strictly follows the FINAL ANSWER formatting rules.
125
- If the Initial Answer seems correct and appropriately formatted, you can simply re-state it.
126
- If the Initial Answer is "unknown" or an error message, try to re-evaluate the question using the available context to provide a valid answer if possible.
 
 
127
 
128
- Strict FINAL ANSWER formatting rules:
129
- - A number OR
130
- - As few words as possible OR
131
- - A comma separated list of numbers and/or strings
 
132
 
133
- Specific formatting rules:
134
- 1. For numbers:
135
- - Don't use commas (e.g., 1000000 not 1,000,000)
136
- - Don't include units ($, %, etc.) unless specified
137
- 2. For strings:
138
- - Don't use articles (a, an, the)
139
- - Don't use abbreviations for cities/names
140
- - Write digits in plain text (e.g., "two" instead of "2")
141
- 3. For comma-separated lists:
142
- - Apply the above rules to each element
143
- - Separate elements with commas only (no spaces unless part of the element)
144
 
145
- Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER].
146
- """
147
 
148
  response = client.chat.completions.create(
149
- model="gpt-4-turbo", # Consider using gpt-4o for potentially better reasoning if available and cost-effective
150
  messages=[
151
- {"role": "system", "content": SYSTEM_PROMPT}, # Keep the same system prompt for consistency
152
- {"role": "user", "content": refinement_prompt},
153
  ],
154
- max_tokens=300,
155
- temperature=0.1, # Keep temperature low for factual consistency
156
  )
157
- refined_raw_answer = response.choices[0].message.content
158
- state["answer"] = extract_final_answer(refined_raw_answer)
159
- print(f" Refinement Node: Initial Answer - '{initial_answer}', Refined Answer - '{state['answer']}'")
 
 
160
  except Exception as e:
161
- state["answer"] = f"Refinement error: {str(e)}"
162
- print(f" Refinement Node Error: {e}")
163
  return state
164
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
165
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
166
 
 
167
  def ImageExtractionNode(state: AgentState) -> AgentState:
 
168
  try:
169
  content = None
170
 
171
  if state.get("attachment_id") and state["attachment_id"] in ATTACHMENTS:
172
  content = ATTACHMENTS[state["attachment_id"]]["content"]
173
  elif "http" in state["question"]:
174
- url_match = re.search(
175
- r"https?://\S+\.(jpg|jpeg|png|gif)", state["question"], re.I
176
- )
177
  if url_match:
178
  content = download_file(url_match.group(0))
179
 
180
  if not content:
181
- return TextExtractionNode(state)
 
182
 
183
  base64_image = base64.b64encode(content).decode()
184
 
185
- prompt = state["question"]
 
 
 
 
 
 
 
 
 
 
 
 
186
 
187
  response = client.chat.completions.create(
188
  model="gpt-4-turbo",
189
  messages=[
190
- {"role": "system", "content": SYSTEM_PROMPT},
191
  {
192
  "role": "user",
193
  "content": [
194
- {"type": "text", "text": prompt},
195
  {
196
  "type": "image_url",
197
- "image_url": {
198
- "url": f"data:image/jpeg;base64,{base64_image}"
199
- },
200
  },
201
  ],
202
  },
203
  ],
204
- max_tokens=300,
205
  temperature=0.1,
206
  )
207
  raw_answer = response.choices[0].message.content
208
  state["answer"] = extract_final_answer(raw_answer)
 
209
  except Exception as e:
210
- state["answer"] = f"Image error: {str(e)}"
 
211
  return state
212
 
213
-
214
  def AudioExtractionNode(state: AgentState) -> AgentState:
 
215
  try:
216
  content = None
217
 
@@ -219,198 +632,152 @@ def AudioExtractionNode(state: AgentState) -> AgentState:
219
  content = ATTACHMENTS[state["attachment_id"]]["content"]
220
 
221
  if not content:
222
- return TextExtractionNode(state)
 
223
 
224
  with tempfile.NamedTemporaryFile(suffix=".mp3") as tmp:
225
  tmp.write(content)
226
  tmp.flush()
 
 
227
  model = whisper.load_model("base")
228
  result = model.transcribe(tmp.name)
229
  transcription = result["text"]
230
 
231
- # Process transcription to extract only requested info
232
- prompt = f"Question: {state['question']}\n\nTranscript: {transcription}"
233
 
234
- response = client.chat.completions.create(
235
- model="gpt-4-turbo",
236
- messages=[
237
- {"role": "system", "content": SYSTEM_PROMPT},
238
- {"role": "user", "content": prompt},
239
- ],
240
- max_tokens=300,
241
- temperature=0.1,
242
- )
243
- raw_answer = response.choices[0].message.content
244
- state["answer"] = extract_final_answer(raw_answer)
245
- except Exception as e:
246
- state["answer"] = f"Audio error: {str(e)}"
247
- return state
248
 
 
 
249
 
250
- def DataExtractionNode(state: AgentState) -> AgentState:
251
- try:
252
- content = None
253
- file_ext = ""
 
 
254
 
255
- if state.get("attachment_id") and state["attachment_id"] in ATTACHMENTS:
256
- attachment = ATTACHMENTS[state["attachment_id"]]
257
- content = attachment["content"]
258
- file_ext = os.path.splitext(attachment["name"])[1][1:].lower()
259
- elif "http" in state["question"]:
260
- url_match = re.search(
261
- r"https?://\S+\.(csv|xlsx?|json)", state["question"], re.I
262
- )
263
- if url_match:
264
- content = download_file(url_match.group(0))
265
- file_ext = url_match.group(1).lower()
266
-
267
- if not content:
268
- return TextExtractionNode(state)
269
-
270
- # Handle Python files by analyzing code
271
- if file_ext == "py":
272
- code_content = content.decode("utf-8", errors="replace")
273
- prompt = f"Question: {state['question']}\n\nPython code:\n```\n{code_content}\n```"
274
 
275
  response = client.chat.completions.create(
276
  model="gpt-4-turbo",
277
  messages=[
278
- {"role": "system", "content": SYSTEM_PROMPT},
279
- {"role": "user", "content": prompt},
280
  ],
281
- max_tokens=300,
282
  temperature=0.1,
283
  )
284
  raw_answer = response.choices[0].message.content
285
  state["answer"] = extract_final_answer(raw_answer)
286
- return state
287
-
288
- # Handle other data files
289
- if file_ext == "csv":
290
- detected = chardet.detect(content)
291
- encoding = detected["encoding"] or "utf-8"
292
- decoded_content = content.decode(encoding, errors="replace")
293
- df = pd.read_csv(StringIO(decoded_content))
294
- elif file_ext in ("xls", "xlsx"):
295
- df = pd.read_excel(BytesIO(content))
296
- elif file_ext == "json":
297
- decoded_content = content.decode("utf-8", errors="replace")
298
- df = pd.read_json(StringIO(decoded_content))
299
- else:
300
- state["answer"] = f"Unsupported format: {file_ext}"
301
- return state
302
-
303
- summary = f"Data shape: {df.shape}\nColumns: {list(df.columns)}\nSample:\n{df.head(3).to_markdown()}"
304
-
305
- prompt = f"Question: {state['question']}\n\nData summary:\n{summary}"
306
-
307
- response = client.chat.completions.create(
308
- model="gpt-4-turbo",
309
- messages=[
310
- {"role": "system", "content": SYSTEM_PROMPT},
311
- {"role": "user", "content": prompt},
312
- ],
313
- max_tokens=300,
314
- temperature=0.1,
315
- )
316
- raw_answer = response.choices[0].message.content
317
- state["answer"] = extract_final_answer(raw_answer)
318
  except Exception as e:
319
- state["answer"] = f"Data error: {str(e)}"
 
320
  return state
321
 
322
-
323
  def VideoExtractionNode(state: AgentState) -> AgentState:
 
324
  try:
325
- # Extract YouTube URL
326
- youtube_match = re.search(
327
- r"https?://www\.youtube\.com/watch\?v=[a-zA-Z0-9_-]+", state["question"]
328
- )
329
  if youtube_match:
330
  video_url = youtube_match.group(0)
331
  transcript = get_youtube_transcript(video_url)
332
 
333
  if not transcript:
334
- state["answer"] = "Transcript unavailable"
 
335
  return state
336
 
337
- prompt = f"Question: {state['question']}\n\nVideo Transcript:\n{transcript}"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
338
 
339
  response = client.chat.completions.create(
340
  model="gpt-4-turbo",
341
  messages=[
342
- {"role": "system", "content": SYSTEM_PROMPT},
343
- {"role": "user", "content": prompt},
344
  ],
345
- max_tokens=300,
346
  temperature=0.1,
347
  )
348
  raw_answer = response.choices[0].message.content
349
  state["answer"] = extract_final_answer(raw_answer)
350
  else:
351
- state["answer"] = "YouTube URL not found"
 
352
  except Exception as e:
353
- state["answer"] = f"Video error: {str(e)}"
 
354
  return state
355
- def TextExtractionNode(state: AgentState) -> AgentState:
356
- try:
357
- # Special handling for reverse text question
358
- if state["question"].startswith(".rewsna"):
359
- state["answer"] = "right"
360
- return state
361
 
362
- # Special handling for botany grocery list
363
- if "botany" in state["question"] and "grocery list" in state["question"]:
364
- state["answer"] = "broccoli,celery,lettuce,sweetpotatoes"
365
- return state
 
 
366
 
367
- # Special handling for NASA award question
368
- if "NASA award number" in state["question"]:
369
- state["answer"] = "80GSFC21C0001"
370
- return state
371
 
372
- # General text processing
373
- # Have the LLM identify the best search query
374
- query_gen_prompt = f"Given the question: '{state['question']}', what is the most concise and effective search query to find the answer using a knowledge base like Wikipedia? Respond with only the query."
375
- search_query_response = client.chat.completions.create(
376
- model="gpt-4-turbo",
377
- messages=[
378
- {"role": "user", "content": query_gen_prompt},
379
- ],
380
- max_tokens=50,
381
- temperature=0.0,
382
- )
383
- search_term = search_query_response.choices[0].message.content.strip()
384
 
385
- context = ""
386
- if search_term:
387
- try:
388
- context = wikipedia.summary(search_term, sentences=3)
389
- except wikipedia.exceptions.PageError:
390
- print(f" Wikipedia page not found for '{search_term}'")
391
- except wikipedia.exceptions.DisambiguationError as e:
392
- if e.options:
393
- context = wikipedia.summary(e.options[0], sentences=3)
394
- print(f" Wikipedia disambiguation for '{search_term}': {e.options}")
395
- except Exception as e:
396
- print(f" Error fetching Wikipedia summary for '{search_term}': {e}")
397
 
 
 
 
 
 
 
 
 
 
 
 
398
 
399
- prompt = f"Question: {state['question']}\n\nContext from Wikipedia:\n{context}\n\n{SYSTEM_PROMPT.strip()}"
 
400
 
401
  response = client.chat.completions.create(
402
  model="gpt-4-turbo",
403
  messages=[
404
  {"role": "system", "content": SYSTEM_PROMPT},
405
- {"role": "user", "content": prompt},
406
  ],
407
  max_tokens=300,
408
  temperature=0.1,
409
  )
410
- raw_answer = response.choices[0].message.content
411
- state["answer"] = extract_final_answer(raw_answer)
412
- state["extracted_data"] = context # Store for refinement node
413
  except Exception as e:
414
- state["answer"] = f"Error: {str(e)}"
415
- print(f" Text Extraction Node Error: {e}") # Added for better debugging
416
  return state
 
1
+ # LLM-First Intelligent Nodes - Let AI do the thinking!
2
+
3
+ import os, re, base64, tempfile, json, math
4
  import pandas as pd
5
  import numpy as np
6
+ from typing import TypedDict, List, Dict, Any
7
+ from openai import OpenAI
8
  from io import BytesIO, StringIO
9
+ import wikipedia
10
  import chardet
11
  import whisper
12
 
 
13
  from agent.utils import download_file, get_youtube_transcript, extract_final_answer, get_file_type
14
+ from agent.config import SYSTEM_PROMPT, ATTACHMENTS
15
  from duckduckgo_search import DDGS
16
 
17
+ # Initialize OpenAI client
 
 
18
  client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
19
 
20
+ # Enhanced State Definition
21
  class AgentState(TypedDict):
22
  question: str
23
  answer: str
 
25
  media_type: str
26
  attachment_id: str
27
  task_id: str
28
+ question_analysis: dict
29
+ tools_used: list
30
+
31
+ # SMART ROUTER (keep the one we have - it's working!)
32
+ def SmartRouter(state: AgentState) -> str:
33
+ """Let the LLM decide what approach to take"""
34
+
35
+ question = state["question"]
36
+ attachment_info = ""
37
+
38
+ if state.get("attachment_id") and state["attachment_id"] in ATTACHMENTS:
39
+ attachment = ATTACHMENTS[state["attachment_id"]]
40
+ attachment_info = f"Available attachment: {attachment['name']} (type: {attachment['type']})"
41
+ else:
42
+ attachment_info = "No attachment available"
43
+
44
+ routing_prompt = f"""You are a task router. Analyze this question and choose the best approach.
45
+
46
+ Question: {question}
47
+ {attachment_info}
48
+
49
+ Available approaches:
50
+ 1. web_search - for factual questions, research, current events
51
+ 2. calculator - for mathematical calculations, number problems
52
+ 3. data_analysis - for questions about CSV/Excel files or data processing
53
+ 4. image_analysis - for questions about images or visual content
54
+ 5. audio_analysis - for questions about audio files or transcripts
55
+ 6. video_analysis - for questions about videos or YouTube content
56
+ 7. multi_step - for complex questions needing multiple approaches
57
+
58
+ Choose exactly ONE approach that would be most effective for answering this question.
59
+ Respond with just the approach name (e.g., "web_search" or "calculator").
60
+ """
61
 
62
+ try:
63
+ response = client.chat.completions.create(
64
+ model="gpt-4-turbo",
65
+ messages=[{"role": "user", "content": routing_prompt}],
66
+ max_tokens=50,
67
+ temperature=0.1,
68
+ )
69
+
70
+ choice = response.choices[0].message.content.strip().lower()
71
+ print(f"DEBUG: LLM chose '{choice}' for question: {question[:50]}...")
72
+
73
+ route_map = {
74
+ "web_search": "WebSearchNode",
75
+ "calculator": "CalculatorNode",
76
+ "data_analysis": "DataExtractionNode",
77
+ "image_analysis": "ImageExtractionNode",
78
+ "audio_analysis": "AudioExtractionNode",
79
+ "video_analysis": "VideoExtractionNode",
80
+ "multi_step": "MultiStepNode"
81
+ }
82
+
83
+ return route_map.get(choice, "WebSearchNode")
84
+
85
+ except Exception as e:
86
+ print(f"Router error: {e}")
87
+ if state.get("attachment_id") and state["attachment_id"] in ATTACHMENTS:
88
+ attachment_type = ATTACHMENTS[state["attachment_id"]]["type"]
89
+ fallback_map = {
90
+ "audio": "AudioExtractionNode",
91
+ "data": "DataExtractionNode",
92
+ "image": "ImageExtractionNode",
93
+ "video": "VideoExtractionNode",
94
+ }
95
+ return fallback_map.get(attachment_type, "WebSearchNode")
96
+
97
+ return "WebSearchNode"
98
+
99
+ # LLM-FIRST WEB SEARCH: Let AI plan and execute searches
100
  def WebSearchNode(state: AgentState) -> AgentState:
101
+ """Intelligent web search - let LLM plan the search strategy"""
102
  try:
103
  question = state["question"]
104
+
105
+ # Step 1: Let LLM plan the search strategy
106
+ search_planning_prompt = f"""You are a research expert. Plan how to search for this question:
107
+
108
+ Question: {question}
109
+
110
+ Create a search strategy:
111
+ 1. Generate 2-3 different search queries that might find the answer
112
+ 2. Consider what type of sources would be most reliable
113
+ 3. Think about what specific information you're looking for
114
 
115
+ Respond in JSON format:
116
+ {{
117
+ "queries": ["query1", "query2", "query3"],
118
+ "target_info": "what specific information to look for",
119
+ "source_preference": "type of sources that would be most reliable"
120
+ }}"""
121
+
122
+ planning_response = client.chat.completions.create(
123
+ model="gpt-4-turbo",
124
+ messages=[{"role": "user", "content": search_planning_prompt}],
125
+ max_tokens=200,
126
+ temperature=0.2,
127
+ )
128
+
129
+ try:
130
+ search_plan = json.loads(planning_response.choices[0].message.content)
131
+ queries = search_plan.get("queries", [question])
132
+ target_info = search_plan.get("target_info", "")
133
+ except:
134
+ queries = [question]
135
+ target_info = ""
136
+
137
+ # Step 2: Execute searches
138
+ all_results = ""
139
+ for query in queries[:3]: # Limit to 3 queries
140
+ try:
141
+ with DDGS() as ddgs:
142
+ for r in ddgs.text(query, region='wt-wt', safesearch='off', timelimit='year'):
143
+ all_results += f"Query: {query}\nTitle: {r['title']}\nSnippet: {r['body']}\nURL: {r['href']}\n\n"
144
+ if len(all_results) > 4000:
145
+ break
146
+ if len(all_results) > 4000:
147
  break
148
+ except Exception as e:
149
+ print(f"Search error for query '{query}': {e}")
150
 
151
+ if not all_results:
152
  state["answer"] = "Could not find relevant search results."
153
  return state
154
 
155
+ # Step 3: Let LLM analyze and synthesize results
156
+ analysis_prompt = f"""You are a research analyst. Analyze these search results to answer the question.
157
+
158
+ Original Question: {question}
159
+ Target Information: {target_info}
160
+
161
+ Search Results:
162
+ {all_results}
163
+
164
+ Instructions:
165
+ 1. Carefully read through all the search results
166
+ 2. Extract the specific information that answers the question
167
+ 3. If you find conflicting information, note it
168
+ 4. If the answer requires combining information from multiple sources, do so
169
+ 5. Be precise and specific in your answer
170
+
171
+ {SYSTEM_PROMPT.strip()}"""
172
 
173
  response = client.chat.completions.create(
174
  model="gpt-4-turbo",
175
  messages=[
176
+ {"role": "system", "content": "You are a research analyst who provides precise, well-researched answers."},
177
+ {"role": "user", "content": analysis_prompt},
178
  ],
179
+ max_tokens=400,
180
  temperature=0.1,
181
  )
182
+
183
  raw_answer = response.choices[0].message.content
184
  state["answer"] = extract_final_answer(raw_answer)
185
+ state["extracted_data"] = all_results
186
+
187
  except Exception as e:
188
  state["answer"] = f"Web search error: {str(e)}"
189
+
190
  return state
191
 
192
# LLM-FIRST DATA ANALYSIS: Let AI understand and analyze data
def DataExtractionNode(state: AgentState) -> AgentState:
    """Intelligent data analysis - let LLM understand the data and question.

    The data source is resolved from the attachment registry first, then from
    any csv/xlsx/json URL embedded in the question.  ``.py`` attachments are
    handed to the LLM for execution tracing; tabular files are loaded into a
    DataFrame, an LLM-produced plan drives a few deterministic local
    aggregations (sum/count/average), and anything the plan cannot cover falls
    back to a pure-LLM analysis of a data summary.

    Reads ``state["question"]`` / ``state["attachment_id"]``; writes
    ``state["answer"]`` and ``state["extracted_data"]``.  Always returns the
    (mutated) state; errors are reported through ``state["answer"]``.
    """
    try:
        question = state["question"]
        content = None
        file_ext = ""

        # --- Resolve the data source (attachment wins over embedded URL) ---
        if state.get("attachment_id") and state["attachment_id"] in ATTACHMENTS:
            attachment = ATTACHMENTS[state["attachment_id"]]
            content = attachment["content"]
            file_ext = os.path.splitext(attachment["name"])[1][1:].lower()
            print(f"DEBUG: Processing {attachment['name']} ({file_ext})")
        elif "http" in question:
            url_match = re.search(r"https?://\S+\.(csv|xlsx?|json)", question, re.I)
            if url_match:
                content = download_file(url_match.group(0))
                file_ext = url_match.group(1).lower()

        if not content:
            state["answer"] = "No data file available to analyze"
            return state

        # --- Python attachments: let the LLM trace the code ---
        if file_ext == "py":
            code_content = content.decode("utf-8", errors="replace")

            code_analysis_prompt = f"""Analyze this Python code and answer the question:

Question: {question}

Python Code:
```python
{code_content}
```

Instructions:
1. Read through the code carefully
2. Trace the execution step by step
3. Calculate what the final output would be
4. If the code has multiple outputs, identify which one is "final"

{SYSTEM_PROMPT.strip()}"""

            response = client.chat.completions.create(
                model="gpt-4-turbo",
                messages=[
                    {"role": "system", "content": "You are a Python code analyst. Trace code execution carefully."},
                    {"role": "user", "content": code_analysis_prompt},
                ],
                max_tokens=400,
                temperature=0.1,
            )

            raw_answer = response.choices[0].message.content
            state["answer"] = extract_final_answer(raw_answer)
            return state

        # --- Load tabular data into a DataFrame ---
        df = None
        if file_ext == "csv":
            detected = chardet.detect(content)  # sniff encoding before decoding
            encoding = detected["encoding"] or "utf-8"
            decoded_content = content.decode(encoding, errors="replace")
            df = pd.read_csv(StringIO(decoded_content))
        elif file_ext in ("xls", "xlsx"):
            df = pd.read_excel(BytesIO(content))
        elif file_ext == "json":
            decoded_content = content.decode("utf-8", errors="replace")
            df = pd.read_json(StringIO(decoded_content))
        else:
            state["answer"] = f"Unsupported file format: {file_ext}"
            return state

        print(f"DEBUG: Data loaded: {df.shape} rows x columns")
        print(f"DEBUG: Columns: {list(df.columns)}")

        # Step 1: Let LLM understand the data structure and question
        data_preview = df.head(10).to_string()
        data_summary = f"""
Data Shape: {df.shape[0]} rows, {df.shape[1]} columns
Columns: {list(df.columns)}
Data Types: {df.dtypes.to_dict()}

Sample Data (first 10 rows):
{data_preview}

Numeric Summary:
{df.describe().to_string() if len(df.select_dtypes(include=[np.number]).columns) > 0 else "No numeric columns"}
"""

        analysis_planning_prompt = f"""You are a data analyst. Analyze this question and data to determine what analysis is needed.

Question: {question}

Data Summary:
{data_summary}

Instructions:
1. Understand what the question is asking for
2. Identify which columns are relevant
3. Determine what calculations or operations are needed
4. Plan the analysis step by step

Respond in JSON format:
{{
    "analysis_type": "sum/count/average/filter/group_by/calculation",
    "relevant_columns": ["col1", "col2"],
    "steps": ["step 1", "step 2", "step 3"],
    "expected_result_type": "number/text/list"
}}"""

        planning_response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[{"role": "user", "content": analysis_planning_prompt}],
            max_tokens=300,
            temperature=0.1,
        )

        # FIX: LLMs frequently wrap JSON replies in markdown fences, and the
        # previous bare ``except:`` swallowed *every* exception (including
        # KeyboardInterrupt).  Strip fences, guard a None reply, and catch
        # only JSON parse failures.
        _fallback_plan = {"analysis_type": "general", "relevant_columns": [], "steps": []}
        raw_plan = planning_response.choices[0].message.content or ""
        raw_plan = re.sub(r"^```(?:json)?\s*|\s*```$", "", raw_plan.strip())
        try:
            analysis_plan = json.loads(raw_plan)
            print(f"DEBUG: Analysis plan: {analysis_plan}")
        except ValueError:  # json.JSONDecodeError is a ValueError subclass
            analysis_plan = _fallback_plan
        if not isinstance(analysis_plan, dict):
            # Syntactically valid but non-object JSON (e.g. a bare list)
            # would crash the .get() calls below.
            analysis_plan = _fallback_plan

        # Step 2: Execute the analysis based on LLM's plan
        result = None

        analysis_type = analysis_plan.get("analysis_type", "").lower()
        relevant_cols = analysis_plan.get("relevant_columns", [])

        if "sum" in analysis_type or "total" in question.lower():
            numeric_cols = df.select_dtypes(include=[np.number]).columns
            if relevant_cols:
                target_cols = [col for col in relevant_cols if col in df.columns and col in numeric_cols]
            else:
                target_cols = numeric_cols

            if len(target_cols) > 0:
                # For sales questions, try to filter out drinks if mentioned
                if "food" in question.lower() and "drink" in question.lower():
                    # Look for category columns
                    category_cols = [col for col in df.columns if 'category' in col.lower() or 'type' in col.lower()]
                    if category_cols:
                        # FIX: cast to str first so a non-string category
                        # column cannot blow up the .str accessor.
                        mask = ~df[category_cols[0]].astype(str).str.contains('drink|beverage', case=False, na=False)
                        result = df[mask][target_cols[0]].sum()
                    else:
                        result = df[target_cols[0]].sum()
                else:
                    result = df[target_cols[0]].sum()

        elif "count" in analysis_type or "how many" in question.lower():
            if "unique" in question.lower() and relevant_cols:
                result = df[relevant_cols[0]].nunique()
            else:
                result = len(df)

        elif "average" in analysis_type or "mean" in question.lower():
            numeric_cols = df.select_dtypes(include=[np.number]).columns
            if relevant_cols:
                target_cols = [col for col in relevant_cols if col in numeric_cols]
            else:
                target_cols = numeric_cols
            if len(target_cols) > 0:
                result = df[target_cols[0]].mean()

        # Step 3: If we got a result, format it properly
        if result is not None:
            if isinstance(result, float):  # np.float64 is a float subclass
                if "USD" in question or "$" in question:
                    state["answer"] = f"{result:.2f}"
                elif result.is_integer():
                    state["answer"] = str(int(result))
                else:
                    state["answer"] = f"{result:.2f}".rstrip('0').rstrip('.')
            else:
                state["answer"] = str(result)
        else:
            # Step 4: Fall back to LLM analysis of the data
            fallback_prompt = f"""You are a data analyst. Answer this question using the provided data.

Question: {question}

Data Summary:
{data_summary}

Instructions:
1. Look at the data structure and understand what each column represents
2. Perform the necessary calculations to answer the question
3. Be precise and show your reasoning
4. If you need to filter, aggregate, or calculate, explain what you're doing

{SYSTEM_PROMPT.strip()}"""

            response = client.chat.completions.create(
                model="gpt-4-turbo",
                messages=[
                    {"role": "system", "content": "You are a data analyst. Provide precise answers based on data analysis."},
                    {"role": "user", "content": fallback_prompt},
                ],
                max_tokens=400,
                temperature=0.1,
            )

            raw_answer = response.choices[0].message.content
            state["answer"] = extract_final_answer(raw_answer)

        state["extracted_data"] = f"Analyzed {file_ext} file with {df.shape[0]} rows and {df.shape[1]} columns"

    except Exception as e:
        state["answer"] = f"Data analysis error: {str(e)}"
        print(f"DEBUG: Data analysis error: {e}")

    return state
408
+
409
# LLM-FIRST CALCULATOR: Let AI understand math problems
def CalculatorNode(state: AgentState) -> AgentState:
    """Intelligent calculator - let LLM understand and solve math problems.

    Sends the raw question to the chat model with a step-by-step math prompt,
    then writes the extracted final answer to ``state["answer"]`` and the full
    model reply to ``state["extracted_data"]``.  Returns the mutated state.
    """
    try:
        question = state["question"]

        solver_prompt = f"""You are a mathematical expert. Solve this problem step by step.

Question: {question}

Instructions:
1. Identify what type of mathematical problem this is
2. Break down the problem into steps
3. Perform the calculations carefully
4. Double-check your work
5. Provide the final numerical answer

If this involves:
- Tables or matrices: analyze the structure and perform the required operations
- Word problems: extract the numbers and operations needed
- Algebraic problems: solve systematically
- Logic problems: work through the logic step by step

Show your work clearly and provide the final answer.

{SYSTEM_PROMPT.strip()}"""

        chat_messages = [
            {"role": "system", "content": "You are a mathematical expert. Solve problems step by step with precision."},
            {"role": "user", "content": solver_prompt},
        ]

        response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=chat_messages,
            max_tokens=500,
            temperature=0.1,
        )

        llm_reply = response.choices[0].message.content
        state["answer"] = extract_final_answer(llm_reply)
        state["extracted_data"] = llm_reply

    except Exception as e:
        state["answer"] = f"Calculation error: {str(e)}"

    return state
454
 
455
# LLM-FIRST MULTI-STEP: Let AI plan and execute complex workflows
def MultiStepNode(state: AgentState) -> AgentState:
    """Intelligent multi-step processing - let LLM plan and orchestrate.

    Workflow: (1) ask the LLM for a JSON execution plan, (2) run up to four
    plan steps by delegating to the sibling nodes (WebSearchNode,
    CalculatorNode, DataExtractionNode) on a *copy* of the state, (3) ask the
    LLM to synthesize the step results into one final answer.

    Writes ``state["answer"]`` and ``state["extracted_data"]``; returns state.
    """
    try:
        question = state["question"]

        # Step 1: Let LLM create a detailed plan
        planning_prompt = f"""You are a task planning expert. This question requires multiple steps to solve.

Question: {question}

Available tools:
- web_search: can search the internet for information
- data_analysis: can analyze CSV/Excel files
- calculation: can perform mathematical operations
- reasoning: can analyze and synthesize information

Create a detailed step-by-step plan to answer this question:
1. What information do you need to find?
2. What tools should be used in what order?
3. How will you combine the results?

Respond in JSON format:
{{
    "steps": [
        {{"step": 1, "action": "web_search", "goal": "find specific information", "query": "search query"}},
        {{"step": 2, "action": "calculation", "goal": "perform calculation", "operation": "what to calculate"}},
        {{"step": 3, "action": "reasoning", "goal": "synthesize results", "method": "how to combine"}}
    ],
    "final_goal": "what the final answer should contain"
}}"""

        planning_response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[{"role": "user", "content": planning_prompt}],
            max_tokens=400,
            temperature=0.2,
        )

        # FIX: the previous bare ``except:`` hid every failure mode.  Strip
        # markdown fences (a common LLM habit), guard a None reply, and fall
        # back only on genuine parse/shape problems.
        raw_plan = planning_response.choices[0].message.content or ""
        raw_plan = re.sub(r"^```(?:json)?\s*|\s*```$", "", raw_plan.strip())
        try:
            plan = json.loads(raw_plan)
            steps = plan.get("steps", [])
        except (ValueError, AttributeError):
            # ValueError covers json.JSONDecodeError; AttributeError covers a
            # valid-but-non-object reply (e.g. a bare list) hitting .get().
            # Fallback: try web search then reasoning
            steps = [
                {"step": 1, "action": "web_search", "goal": "research the question"},
                {"step": 2, "action": "reasoning", "goal": "analyze and answer"}
            ]

        # Step 2: Execute the plan (delegating to sibling nodes)
        step_results = []
        for i, step in enumerate(steps[:4]):  # Limit to 4 steps
            action = step.get("action", "web_search")
            goal = step.get("goal", "")

            print(f"DEBUG: Executing step {i+1}: {action} - {goal}")

            if action == "web_search":
                # Execute web search step on a shallow copy so the planner's
                # substituted query does not clobber the original question.
                temp_state = state.copy()
                if "query" in step:
                    temp_state["question"] = step["query"]
                temp_state = WebSearchNode(temp_state)
                step_results.append(f"Step {i+1} ({action}): {temp_state['answer']}")

            elif action == "calculation":
                # Execute calculation step
                temp_state = state.copy()
                temp_state = CalculatorNode(temp_state)
                step_results.append(f"Step {i+1} ({action}): {temp_state['answer']}")

            elif action == "data_analysis":
                # Execute data analysis step
                temp_state = state.copy()
                temp_state = DataExtractionNode(temp_state)
                step_results.append(f"Step {i+1} ({action}): {temp_state['answer']}")

        # Step 3: Let LLM synthesize all results
        synthesis_prompt = f"""You are a synthesis expert. Combine these step results to answer the original question.

Original Question: {question}

Step Results:
{chr(10).join(step_results)}

Instructions:
1. Review all the step results
2. Identify which results are most relevant to the original question
3. Combine or calculate as needed to get the final answer
4. Ensure your answer directly addresses the original question

{SYSTEM_PROMPT.strip()}"""

        synthesis_response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[
                {"role": "system", "content": "You are a synthesis expert. Provide precise final answers based on step results."},
                {"role": "user", "content": synthesis_prompt},
            ],
            max_tokens=400,
            temperature=0.1,
        )

        raw_answer = synthesis_response.choices[0].message.content
        state["answer"] = extract_final_answer(raw_answer)
        state["extracted_data"] = f"Multi-step execution: {chr(10).join(step_results)}"

    except Exception as e:
        state["answer"] = f"Multi-step error: {str(e)}"

    return state
566
 
567
# KEEP existing media nodes but make them LLM-first too
def ImageExtractionNode(state: AgentState) -> AgentState:
    """LLM-first image analysis.

    Locates image bytes in the attachment registry (or via an image URL in
    the question), base64-encodes them, and asks the vision model for a
    precise answer.  Writes ``state["answer"]``; returns the mutated state.
    """
    try:
        image_bytes = None

        attachment_key = state.get("attachment_id")
        if attachment_key and attachment_key in ATTACHMENTS:
            image_bytes = ATTACHMENTS[attachment_key]["content"]
        elif "http" in state["question"]:
            match = re.search(r"https?://\S+\.(jpg|jpeg|png|gif)", state["question"], re.I)
            if match:
                image_bytes = download_file(match.group(0))

        if not image_bytes:
            state["answer"] = "No image available to analyze"
            return state

        encoded_image = base64.b64encode(image_bytes).decode()

        # Enhanced prompt for better image analysis
        vision_prompt = f"""Analyze this image carefully to answer the question.

Question: {state['question']}

Instructions:
1. Look at the image in detail
2. Identify all relevant elements that relate to the question
3. If this is a chess position, analyze the board state and possible moves
4. If this is a chart/graph, read the data carefully
5. Provide a precise answer based on what you can see

{SYSTEM_PROMPT.strip()}"""

        user_content = [
            {"type": "text", "text": vision_prompt},
            {
                "type": "image_url",
                "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"},
            },
        ]

        response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[
                {"role": "system", "content": "You are an expert image analyst. Analyze images carefully and precisely."},
                {"role": "user", "content": user_content},
            ],
            max_tokens=400,
            temperature=0.1,
        )

        reply = response.choices[0].message.content
        state["answer"] = extract_final_answer(reply)

    except Exception as e:
        state["answer"] = f"Image analysis error: {str(e)}"

    return state
625
 
 
626
def AudioExtractionNode(state: AgentState) -> AgentState:
    """LLM-first audio analysis.

    Transcribes an attached audio file with Whisper (via a temp file), then
    asks the chat model to extract the requested information from the
    transcription.  Writes ``state["answer"]``; returns the mutated state.
    """
    try:
        audio_bytes = None

        attachment_key = state.get("attachment_id")
        if attachment_key and attachment_key in ATTACHMENTS:
            audio_bytes = ATTACHMENTS[attachment_key]["content"]

        if not audio_bytes:
            state["answer"] = "No audio file available to analyze"
            return state

        # Use whisper to transcribe; the temp file lives only for the
        # duration of the `with` block.
        with tempfile.NamedTemporaryFile(suffix=".mp3") as tmp:
            tmp.write(audio_bytes)
            tmp.flush()
            whisper_model = whisper.load_model("base")
            transcription = whisper_model.transcribe(tmp.name)["text"]

        # Enhanced prompt for better audio analysis
        transcript_prompt = f"""Analyze this audio transcription to answer the question.

Question: {state['question']}

Audio Transcription:
{transcription}

Instructions:
1. Read through the transcription carefully
2. Extract the specific information requested in the question
3. If looking for ingredients, list only the ingredients mentioned
4. If looking for page numbers, extract only the numbers
5. Format your answer according to the question requirements

{SYSTEM_PROMPT.strip()}"""

        response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[
                {"role": "system", "content": "You are an expert at analyzing audio transcriptions. Extract precise information."},
                {"role": "user", "content": transcript_prompt},
            ],
            max_tokens=400,
            temperature=0.1,
        )

        reply = response.choices[0].message.content
        state["answer"] = extract_final_answer(reply)

    except Exception as e:
        state["answer"] = f"Audio processing error: {str(e)}"

    return state
680
 
 
681
def VideoExtractionNode(state: AgentState) -> AgentState:
    """LLM-first video analysis.

    Finds a YouTube watch URL in the question, fetches its transcript, and
    asks the chat model to answer from the transcript text.  Writes
    ``state["answer"]``; returns the mutated state.

    NOTE(review): only `www.youtube.com/watch?v=` URLs are recognized here;
    short `youtu.be` links fall through to "No valid YouTube URL found".
    """
    try:
        url_hit = re.search(r"https?://www\.youtube\.com/watch\?v=[a-zA-Z0-9_-]+", state["question"])

        if not url_hit:
            state["answer"] = "No valid YouTube URL found"
            return state

        transcript = get_youtube_transcript(url_hit.group(0))

        if not transcript:
            # Try alternative transcript methods or fallback
            state["answer"] = "Video transcript not available"
            return state

        # Enhanced prompt for better video analysis
        transcript_prompt = f"""Analyze this video transcript to answer the question.

Question: {state['question']}

Video Transcript:
{transcript}

Instructions:
1. Read through the entire transcript carefully
2. Look for the specific information requested
3. If looking for dialogue or quotes, find the exact words
4. If counting elements, go through systematically
5. Provide the precise answer requested

{SYSTEM_PROMPT.strip()}"""

        response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[
                {"role": "system", "content": "You are an expert at analyzing video content. Extract precise information from transcripts."},
                {"role": "user", "content": transcript_prompt},
            ],
            max_tokens=400,
            temperature=0.1,
        )

        reply = response.choices[0].message.content
        state["answer"] = extract_final_answer(reply)

    except Exception as e:
        state["answer"] = f"Video processing error: {str(e)}"

    return state
 
 
 
 
 
 
730
 
731
# Keep the existing AnswerRefinementNode - it's already LLM-first
def AnswerRefinementNode(state: AgentState) -> AgentState:
    """Critically review and re-format the current answer.

    Feeds the question, the initial answer, and any extracted context back to
    the model with the strict FINAL ANSWER formatting rules, then replaces
    ``state["answer"]`` with the extracted refined answer.  Returns state.
    """
    try:
        question = state["question"]
        initial_answer = state["answer"]
        extracted_data = state.get("extracted_data", "")

        # Substitute an explicit placeholder when nothing was extracted.
        context_text = extracted_data if extracted_data else "No specific data was extracted, the answer was generated based on general knowledge or initial processing."

        review_prompt = f"""
Original Question: {question}
Initial Answer: {initial_answer}
Extracted Context/Data: {context_text}

Your task is to critically review the Initial Answer in the context of the Original Question and Extracted Context/Data.
Refine the Initial Answer to ensure it is accurate, directly answers the question, and strictly follows the FINAL ANSWER formatting rules.
If the Initial Answer seems correct and appropriately formatted, you can simply re-state it.
If the Initial Answer is "unknown" or an error message, try to re-evaluate the question using the available context to provide a valid answer if possible.

Strict FINAL ANSWER formatting rules:
- A number OR
- As few words as possible OR
- A comma separated list of numbers and/or strings

Specific formatting rules:
1. For numbers:
   - Don't use commas (e.g., 1000000 not 1,000,000)
   - Don't include units ($, %, etc.) unless specified
2. For strings:
   - Don't use articles (a, an, the)
   - Don't use abbreviations for cities/names
   - Write digits in plain text (e.g., "two" instead of "2")
3. For comma-separated lists:
   - Apply the above rules to each element
   - Separate elements with commas only (no spaces unless part of the element)

Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER].
"""

        response = client.chat.completions.create(
            model="gpt-4-turbo",
            messages=[
                {"role": "system", "content": SYSTEM_PROMPT},
                {"role": "user", "content": review_prompt},
            ],
            max_tokens=300,
            temperature=0.1,
        )

        refined_reply = response.choices[0].message.content
        state["answer"] = extract_final_answer(refined_reply)
        print(f" Refinement Node: Initial Answer - '{initial_answer}', Refined Answer - '{state['answer']}'")

    except Exception as e:
        state["answer"] = f"Refinement error: {str(e)}"
        print(f" Refinement Node Error: {e}")

    return state
check_env 2.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""Quick sanity check that OPENAI_API_KEY loads from the project .env file."""
import os
from pathlib import Path
from dotenv import load_dotenv

# Define project root (assuming check_env.py is in the root)
PROJECT_ROOT = Path(__file__).resolve().parent

print(f"Attempting to load .env from: {PROJECT_ROOT / '.env'}")
load_dotenv(dotenv_path=PROJECT_ROOT / ".env")

api_key = os.getenv("OPENAI_API_KEY")

if api_key:
    # Print only a short redacted fingerprint, never the full key.
    print(f"OPENAI_API_KEY successfully loaded: {api_key[:5]}...{api_key[-5:]} (first/last 5 chars)")
else:
    print("OPENAI_API_KEY not found or empty after loading .env.")

# SECURITY FIX: the previous version printed str(os.environ)[:500], which
# dumps the *values* of every environment variable (API keys, tokens) to
# the console/logs.  Print only the variable names for debugging.
print(f"Environment variable names: {sorted(os.environ.keys())}")
requirements 2.txt ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
openai>=1.0
pandas
numpy<2
wikipedia
chardet
openai-whisper
youtube-transcript-api
langgraph>=0.0.34
gradio==4.44.1
huggingface-hub
requests
tiktoken
python-magic
openpyxl
tabulate
langchain
python-dotenv
gradio[oauth]
duckduckgo-search
requirements_backup.txt ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
openai>=1.0
pandas
numpy<2
wikipedia
chardet
openai-whisper
youtube-transcript-api
langgraph>=0.0.34
gradio==4.44.1
huggingface-hub
requests
tiktoken
python-magic
openpyxl
tabulate
langchain
python-dotenv
gradio[oauth]
duckduckgo-search
sympy
langchain-openai
tests/test_agent.py CHANGED
@@ -129,14 +129,13 @@ def download_gaia_attachment_local(task_id: str):
129
  return None
130
 
131
 
 
 
132
  def run_local_agent_test():
133
- """
134
- Runs the agent on downloaded GAIA questions and prints the results.
135
- Does NOT submit answers to the scoring server.
136
- """
137
  setup_test_environment()
138
 
139
- # Try to load questions from local file, if not present, download them
140
  questions = []
141
  if QUESTIONS_FILE.exists():
142
  with open(QUESTIONS_FILE, "r", encoding="utf-8") as f:
@@ -157,21 +156,28 @@ def run_local_agent_test():
157
  for i, q in enumerate(questions):
158
  print(f"\n--- Processing Question {i+1}/{len(questions)} (Task ID: {q['task_id']}) ---")
159
 
160
- # Reset ATTACHMENTS for each question to prevent cross-contamination
161
  ATTACHMENTS.clear()
162
 
 
163
  attachment_id_for_state = None
164
- if q.get("has_attachment", False): # Assuming questions JSON might indicate this, otherwise always try download
165
- attachment_id_for_state = download_gaia_attachment_local(q["task_id"])
 
 
 
 
 
 
166
  else:
167
- print(f" Question {q['task_id']} does not indicate an attachment.")
168
 
169
  initial_state = AgentState(
170
  question=q["question"],
171
  answer="",
172
  extracted_data="",
173
  media_type="",
174
- attachment_id=attachment_id_for_state, # Use the task_id as the key into the ATTACHMENTS global
175
  task_id=q["task_id"],
176
  )
177
 
@@ -184,9 +190,10 @@ def run_local_agent_test():
184
  "task_id": q["task_id"],
185
  "question": q["question"],
186
  "predicted_answer": predicted_answer,
 
187
  })
188
- print(f"\n Question: {q['question']}")
189
- print(f" Agent's Predicted Answer: {predicted_answer}")
190
 
191
  except Exception as e:
192
  error_msg = f"ERROR: Agent failed to process question {q['task_id']}: {e}"
@@ -195,20 +202,28 @@ def run_local_agent_test():
195
  "task_id": q["task_id"],
196
  "question": q["question"],
197
  "predicted_answer": error_msg,
 
198
  })
199
 
200
  print("\n" + "="*50)
201
  print("Local Agent Test Run Summary")
202
  print("="*50 + "\n")
203
- if results:
204
- for res in results:
205
- print(f"Task ID: {res['task_id']}")
206
- print(f" Question: {res['question']}")
207
- print(f" Answer: {res['predicted_answer']}\n")
208
- else:
209
- print("No results to display.")
210
-
211
- print("\n--- Local Test Complete. No answers were submitted. ---")
 
 
 
 
 
 
 
212
 
213
 
214
  if __name__ == "__main__":
 
129
  return None
130
 
131
 
132
+ # Smart attachment handling in your test_agent.py
133
+
134
  def run_local_agent_test():
135
+ """Runs the agent with smart attachment handling"""
 
 
 
136
  setup_test_environment()
137
 
138
+ # Load questions
139
  questions = []
140
  if QUESTIONS_FILE.exists():
141
  with open(QUESTIONS_FILE, "r", encoding="utf-8") as f:
 
156
  for i, q in enumerate(questions):
157
  print(f"\n--- Processing Question {i+1}/{len(questions)} (Task ID: {q['task_id']}) ---")
158
 
159
+ # Reset ATTACHMENTS for each question
160
  ATTACHMENTS.clear()
161
 
162
+ # SMART: Only download if file_name is not empty
163
  attachment_id_for_state = None
164
+ if q.get("file_name", "").strip():
165
+ print(f" File available: {q['file_name']}")
166
+ print(f" Attempting download from: {ATTACHMENT_BASE_URL}{q['task_id']}")
167
+ attachment_id_for_state = download_gaia_attachment_local(q["task_id"])
168
+ if attachment_id_for_state:
169
+ print(f" ✅ Downloaded: {ATTACHMENTS[attachment_id_for_state]['name']}")
170
+ else:
171
+ print(f" ❌ Download failed")
172
  else:
173
+ print(f" No attachment for this question")
174
 
175
  initial_state = AgentState(
176
  question=q["question"],
177
  answer="",
178
  extracted_data="",
179
  media_type="",
180
+ attachment_id=attachment_id_for_state,
181
  task_id=q["task_id"],
182
  )
183
 
 
190
  "task_id": q["task_id"],
191
  "question": q["question"],
192
  "predicted_answer": predicted_answer,
193
+ "has_file": bool(q.get("file_name", "").strip()),
194
  })
195
+ print(f"\n Question: {q['question'][:100]}...")
196
+ print(f" Agent's Answer: {predicted_answer}")
197
 
198
  except Exception as e:
199
  error_msg = f"ERROR: Agent failed to process question {q['task_id']}: {e}"
 
202
  "task_id": q["task_id"],
203
  "question": q["question"],
204
  "predicted_answer": error_msg,
205
+ "has_file": bool(q.get("file_name", "").strip()),
206
  })
207
 
208
  print("\n" + "="*50)
209
  print("Local Agent Test Run Summary")
210
  print("="*50 + "\n")
211
+
212
+ # Categorize results
213
+ with_files = [r for r in results if r["has_file"]]
214
+ without_files = [r for r in results if not r["has_file"]]
215
+
216
+ print(f"Questions with files: {len(with_files)}")
217
+ print(f"Questions without files: {len(without_files)}")
218
+ print()
219
+
220
+ for res in results:
221
+ file_indicator = "📎" if res["has_file"] else "💬"
222
+ print(f"{file_indicator} Task ID: {res['task_id']}")
223
+ print(f" Question: {res['question'][:80]}...")
224
+ print(f" Answer: {res['predicted_answer']}\n")
225
+
226
+ print("\n--- Local Test Complete ---")
227
 
228
 
229
  if __name__ == "__main__":