mabelwang21 commited on
Commit
97c9b88
·
1 Parent(s): f3a76b7

init test simple agent

Browse files
Files changed (7) hide show
  1. README.md +2 -0
  2. agent.py +118 -0
  3. app.py +198 -0
  4. metadata.jsonl +0 -0
  5. requirements.txt +10 -0
  6. tool_counts.csv +94 -0
  7. view_jsonfile.ipynb +381 -0
README.md CHANGED
@@ -7,6 +7,8 @@ sdk: gradio
7
  sdk_version: 5.27.0
8
  app_file: app.py
9
  pinned: false
 
 
10
  ---
11
 
12
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
7
  sdk_version: 5.27.0
8
  app_file: app.py
9
  pinned: false
10
+ hf_oauth: true
11
+ hf_oauth_expiration_minutes: 480
12
  ---
13
 
14
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
agent.py ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from smolagents import ToolCallingAgent, tool
2
+ from langchain_community.tools import DuckDuckGoSearchRun
3
+ from langchain_community.utilities import WikipediaAPIWrapper
4
+ from langchain.tools import BaseTool
5
+ from PIL import Image
6
+ import pytesseract
7
+ import fitz
8
+ import ast
9
+ import os
10
+
11
+ # -------------------- TOOL DEFINITIONS --------------------
12
+
13
+
14
+ @tool
15
+ def web_search(query: str) -> str:
16
+ """
17
+ Search the web using DuckDuckGo.
18
+
19
+ Args:
20
+ query (str): The search query string.
21
+
22
+ Returns:
23
+ str: Summary of search results.
24
+ """
25
+ search = DuckDuckGoSearchRun()
26
+ return search.run(query)
27
+
28
@tool
def wikipedia_search(query: str) -> str:
    """
    Look up a topic on Wikipedia and return relevant content.

    Args:
        query (str): The topic or term to search on Wikipedia.

    Returns:
        str: Extracted Wikipedia content.
    """
    # Bug fix: the original called WikipediaQueryRun(), a name that is never
    # imported in this module (only WikipediaAPIWrapper is), so every call
    # raised NameError. Use the imported WikipediaAPIWrapper instead.
    wiki = WikipediaAPIWrapper()
    return wiki.run(query)
41
+
42
@tool
def image_recognition(image_path: str) -> str:
    """
    Perform OCR on an image to extract text.

    Args:
        image_path (str): Path to the image file.

    Returns:
        str: Extracted text from the image.
    """
    picture = Image.open(image_path)
    text = pytesseract.image_to_string(picture)
    return text
55
+
56
@tool
def read_pdf(pdf_path: str) -> str:
    """
    Extract all text from a PDF document.

    Args:
        pdf_path (str): Path to the PDF file.

    Returns:
        str: Text content of the PDF (pages concatenated in order).
    """
    document = fitz.open(pdf_path)
    page_texts = [page.get_text() for page in document]
    return "".join(page_texts)
69
+
70
@tool
def calculate(expr: str) -> float:
    """
    Safely evaluate a simple arithmetic expression.

    Supports +, -, *, / and ** plus unary +/- on numeric literals. Walks the
    AST instead of calling eval(), so arbitrary code in *expr* cannot run.

    Args:
        expr (str): The math expression to evaluate, e.g. "2 * (3 + 4)".

    Returns:
        float: Result of the expression.

    Raises:
        TypeError: If the expression contains an unsupported construct
            (names, calls, unsupported operators, non-numeric constants).
        SyntaxError: If *expr* is not valid Python expression syntax.
    """
    def _eval(node):
        if isinstance(node, ast.BinOp):
            left = _eval(node.left)
            right = _eval(node.right)
            if isinstance(node.op, ast.Add): return left + right
            if isinstance(node.op, ast.Sub): return left - right
            if isinstance(node.op, ast.Mult): return left * right
            if isinstance(node.op, ast.Div): return left / right
            if isinstance(node.op, ast.Pow): return left ** right
            # Bug fix: the original fell through and implicitly returned None
            # for operators like % or //; fail loudly instead.
            raise TypeError(f"Unsupported operator: {type(node.op).__name__}")
        elif isinstance(node, ast.UnaryOp):
            operand = _eval(node.operand)
            if isinstance(node.op, ast.UAdd): return +operand
            if isinstance(node.op, ast.USub): return -operand
            raise TypeError(f"Unsupported unary operator: {type(node.op).__name__}")
        elif isinstance(node, ast.Constant):
            # ast.Constant replaces ast.Num (deprecated since Python 3.8).
            # Exclude bool explicitly: True/False are int subclasses.
            if isinstance(node.value, (int, float)) and not isinstance(node.value, bool):
                return node.value
            raise TypeError(f"Unsupported constant: {node.value!r}")
        else:
            raise TypeError(f"Unsupported type: {node}")
    parsed = ast.parse(expr, mode='eval').body
    return _eval(parsed)
100
+
101
# -------------------- AGENT CLASS --------------------

# Tool registry handed to the ToolCallingAgent below.
tools = [web_search, wikipedia_search, image_recognition, read_pdf, calculate]

class MyAgent:
    """Thin callable wrapper around a smolagents ToolCallingAgent.

    Calling an instance with a question string returns a single-line
    "FINAL ANSWER: ..." string, never raising to the caller.
    """

    def __init__(self):
        # Local import keeps module import side-effect free if HfApiModel
        # pulls in heavy dependencies.
        from smolagents import HfApiModel
        self.agent = ToolCallingAgent(
            tools=tools,
            model=HfApiModel("openai/gpt-3.5-turbo")  # or another supported model
        )

    def __call__(self, question: str) -> str:
        """Run the agent on *question* and return a formatted answer string."""
        try:
            result = self.agent.run(question)
            # Robustness fix: agent.run() may return a non-str result object;
            # coerce to str before stripping so .strip() cannot AttributeError.
            return f"FINAL ANSWER: {str(result).strip()}"
        except Exception as e:
            # Never propagate: the caller expects a printable answer string.
            return f"FINAL ANSWER: ERROR - {e}"
app.py ADDED
@@ -0,0 +1,198 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import gradio as gr
3
+ import requests
4
+ import inspect
5
+ import pandas as pd
6
+ from agent import MyAgent
7
+
8
+ # (Keep Constants as is)
9
+ # --- Constants ---
10
+ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
11
+
12
+ # --- Basic Agent Definition ---
13
+ # ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------
14
class BasicAgent:
    """Trivial stand-in agent: ignores the question and returns a canned reply."""

    def __init__(self):
        print("BasicAgent initialized.")

    def __call__(self, question: str) -> str:
        # Log a truncated preview of the incoming question.
        print(f"Agent received question (first 50 chars): {question[:50]}...")
        fixed_answer = "This is a default answer."
        print(f"Agent returning fixed answer: {fixed_answer}")
        return fixed_answer
22
+
23
def run_and_submit_all( profile: gr.OAuthProfile | None):
    """
    Fetches all questions, runs the BasicAgent on them, submits all answers,
    and displays the results.

    Args:
        profile: OAuth profile of the logged-in Hugging Face user, injected
            by Gradio's LoginButton; None when nobody is logged in.

    Returns:
        tuple: (status_message: str, results_table: pandas.DataFrame or None).
    """
    # --- Determine HF Space Runtime URL and Repo URL ---
    space_id = os.getenv("SPACE_ID") # Get the SPACE_ID for sending link to the code

    # Login is required because the scoring server keys submissions by username.
    if profile:
        username= f"{profile.username}"
        print(f"User logged in: {username}")
    else:
        print("User not logged in.")
        return "Please Login to Hugging Face with the button.", None

    api_url = DEFAULT_API_URL
    questions_url = f"{api_url}/questions"
    submit_url = f"{api_url}/submit"

    # 1. Instantiate Agent ( modify this part to create your agent)
    try:
        agent = MyAgent()

    except Exception as e:
        print(f"Error instantiating agent: {e}")
        return f"Error initializing agent: {e}", None
    # In the case of an app running as a Hugging Face space, this link points toward your codebase (useful for others so please keep it public)
    agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
    print(agent_code)

    # 2. Fetch Questions
    print(f"Fetching questions from: {questions_url}")
    try:
        response = requests.get(questions_url, timeout=15)
        response.raise_for_status()
        questions_data = response.json()
        if not questions_data:
            print("Fetched questions list is empty.")
            return "Fetched questions list is empty or invalid format.", None
        print(f"Fetched {len(questions_data)} questions.")
    except requests.exceptions.RequestException as e:
        print(f"Error fetching questions: {e}")
        return f"Error fetching questions: {e}", None
    except requests.exceptions.JSONDecodeError as e:
        # response is guaranteed bound here: JSONDecodeError can only come
        # from response.json() above.
        print(f"Error decoding JSON response from questions endpoint: {e}")
        print(f"Response text: {response.text[:500]}")
        return f"Error decoding server response for questions: {e}", None
    except Exception as e:
        print(f"An unexpected error occurred fetching questions: {e}")
        return f"An unexpected error occurred fetching questions: {e}", None

    # 3. Run your Agent
    results_log = []       # one row per question, shown in the UI table
    answers_payload = []   # what actually gets POSTed to the scoring server
    print(f"Running agent on {len(questions_data)} questions...")
    for item in questions_data:
        task_id = item.get("task_id")
        question_text = item.get("question")
        if not task_id or question_text is None:
            print(f"Skipping item with missing task_id or question: {item}")
            continue
        try:
            submitted_answer = agent(question_text)
            answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
            results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
        except Exception as e:
            # One failing question must not abort the whole run; record and continue.
            print(f"Error running agent on task {task_id}: {e}")
            results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})

    if not answers_payload:
        print("Agent did not produce any answers to submit.")
        return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)

    # 4. Prepare Submission
    submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
    status_update = f"Agent finished. Submitting {len(answers_payload)} answers for user '{username}'..."
    print(status_update)

    # 5. Submit
    print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
    try:
        response = requests.post(submit_url, json=submission_data, timeout=60)
        response.raise_for_status()
        result_data = response.json()
        final_status = (
            f"Submission Successful!\n"
            f"User: {result_data.get('username')}\n"
            f"Overall Score: {result_data.get('score', 'N/A')}% "
            f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
            f"Message: {result_data.get('message', 'No message received.')}"
        )
        print("Submission successful.")
        results_df = pd.DataFrame(results_log)
        return final_status, results_df
    except requests.exceptions.HTTPError as e:
        # Non-2xx response: try to surface the server-provided detail.
        error_detail = f"Server responded with status {e.response.status_code}."
        try:
            error_json = e.response.json()
            error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
        except requests.exceptions.JSONDecodeError:
            error_detail += f" Response: {e.response.text[:500]}"
        status_message = f"Submission Failed: {error_detail}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except requests.exceptions.Timeout:
        status_message = "Submission Failed: The request timed out."
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except requests.exceptions.RequestException as e:
        status_message = f"Submission Failed: Network error - {e}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
    except Exception as e:
        status_message = f"An unexpected error occurred during submission: {e}"
        print(status_message)
        results_df = pd.DataFrame(results_log)
        return status_message, results_df
143
+
144
+
145
# --- Build Gradio Interface using Blocks ---
with gr.Blocks() as demo:
    gr.Markdown("# Basic Agent Evaluation Runner")
    gr.Markdown(
        """
        **Instructions:**

        1. Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
        2. Log in to your Hugging Face account using the button below. This uses your HF username for submission.
        3. Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.

        ---
        **Disclaimers:**
        Once clicking on the "submit button, it can take quite some time ( this is the time for the agent to go through all the questions).
        This space provides a basic setup and is intentionally sub-optimal to encourage you to develop your own, more robust solution. For instance for the delay process of the submit button, a solution could be to cache the answers and submit in a seperate action or even to answer the questions in async.
        """
    )

    # LoginButton makes a gr.OAuthProfile implicitly available; Gradio injects
    # it into run_and_submit_all's `profile` parameter on click, which is why
    # the click handler below declares no `inputs`.
    gr.LoginButton()

    run_button = gr.Button("Run Evaluation & Submit All Answers")

    status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
    # Removed max_rows=10 from DataFrame constructor
    results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)

    run_button.click(
        fn=run_and_submit_all,
        outputs=[status_output, results_table]
    )
175
+
176
if __name__ == "__main__":
    print("\n" + "-"*30 + " App Starting " + "-"*30)
    # Check for SPACE_HOST and SPACE_ID at startup for information
    # (both are set by the Hugging Face Spaces runtime; absent locally).
    space_host_startup = os.getenv("SPACE_HOST")
    space_id_startup = os.getenv("SPACE_ID") # Get SPACE_ID at startup

    if space_host_startup:
        print(f"✅ SPACE_HOST found: {space_host_startup}")
        print(f"   Runtime URL should be: https://{space_host_startup}.hf.space")
    else:
        print("ℹ️  SPACE_HOST environment variable not found (running locally?).")

    if space_id_startup: # Print repo URLs if SPACE_ID is found
        print(f"✅ SPACE_ID found: {space_id_startup}")
        print(f"   Repo URL: https://huggingface.co/spaces/{space_id_startup}")
        print(f"   Repo Tree URL: https://huggingface.co/spaces/{space_id_startup}/tree/main")
    else:
        print("ℹ️  SPACE_ID environment variable not found (running locally?). Repo URL cannot be determined.")

    print("-"*(60 + len(" App Starting ")) + "\n")

    print("Launching Gradio Interface for Basic Agent Evaluation...")
    demo.launch(debug=True, share=False)
metadata.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
requirements.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ gradio
2
+ requests
3
+ langchain
4
+ langchain-community
5
+ smolagents
6
+ duckduckgo-search
7
+ wikipedia
8
+ pytesseract
9
+ Pillow
10
+ pymupdf
tool_counts.csv ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Tool,Count
2
+ Web browser,95
3
+ Search engine,88
4
+ Calculator,30
5
+ Image recognition tools,11
6
+ search engine,9
7
+ None,9
8
+ web browser,8
9
+ A search engine,8
10
+ A web browser,8
11
+ PDF viewer,7
12
+ PDF access,7
13
+ Microsoft Excel,5
14
+ Image recognition,5
15
+ A calculator,4
16
+ calculator,4
17
+ OCR,4
18
+ Web Browser,3
19
+ Excel,3
20
+ Color recognition,3
21
+ Access to Wikipedia,3
22
+ Excel file access,3
23
+ Python,3
24
+ A file interface,3
25
+ Microsoft Excel / Google Sheets,3
26
+ A web browser.,2
27
+ Search Engine,2
28
+ A search engine.,2
29
+ File handling,2
30
+ Video recognition tools,2
31
+ Audio capability,2
32
+ A speech-to-text tool,2
33
+ image recognition/OCR,2
34
+ Word document access,1
35
+ Counter,1
36
+ A word reversal tool / script,1
37
+ Tool to extract text from images,1
38
+ Python compiler,1
39
+ Image recognition tools (to identify and parse a figure with three axes),1
40
+ Unlambda compiler (optional),1
41
+ A calculator.,1
42
+ google search,1
43
+ video recognition tools,1
44
+ JSONLD file access,1
45
+ Video parsing,1
46
+ (Optional) Web browser,1
47
+ code/data analysis tools,1
48
+ Text processing/diff tool,1
49
+ GIF parsing tools,1
50
+ "Access to the Internet Archive, web.archive.org",1
51
+ XML file access,1
52
+ a calculator,1
53
+ PDF reader,1
54
+ Markdown,1
55
+ Google Translate access,1
56
+ Bass note data,1
57
+ Text Editor,1
58
+ XLSX file access,1
59
+ PowerPoint viewer,1
60
+ CSV file access,1
61
+ Calculator (or use Excel),1
62
+ (Optional) Search engine,1
63
+ computer algebra system,1
64
+ Video processing software,1
65
+ Computer vision,1
66
+ Audio processing software,1
67
+ Google Maps,1
68
+ Access to Excel files,1
69
+ Calculator (or ability to count),1
70
+ A Python IDE,1
71
+ Spreadsheet editor,1
72
+ No tools required,1
73
+ Image recognition and processing tools,1
74
+ Computer vision or OCR,1
75
+ C++ compiler,1
76
+ Access to Google Maps,1
77
+ Image recognition/OCR,1
78
+ YouTube player,1
79
+ Natural language processor,1
80
+ Graph interaction tools,1
81
+ Bablyonian cuniform -> arabic legend,1
82
+ Access to YouTube,1
83
+ image recognition tools,1
84
+ image search tools,1
85
+ Calculator or counting function,1
86
+ A speech-to-text audio processing tool,1
87
+ Access to academic journal websites,1
88
+ pdf reader/extracter,1
89
+ Rubik's cube model,1
90
+ Wikipedia,1
91
+ Video capability,1
92
+ Image processing tools,1
93
+ Image recognition software,1
94
+ YouTube,1
view_jsonfile.ipynb ADDED
@@ -0,0 +1,381 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 2,
6
+ "id": "d0191263",
7
+ "metadata": {},
8
+ "outputs": [],
9
+ "source": [
10
+ "#load in metadata.jsonl file to view it\n",
11
+ "import json\n",
12
+ "import jsonlines\n",
13
+ "import pandas as pd\n",
14
+ "import os\n",
15
+ "import numpy as np\n",
16
+ "\n",
17
+ "# Load the metadata.jsonl file\n",
18
+ "with jsonlines.open('metadata.jsonl') as reader:\n",
19
+ " metadata = [obj for obj in reader]"
20
+ ]
21
+ },
22
+ {
23
+ "cell_type": "code",
24
+ "execution_count": 5,
25
+ "id": "6820d40d",
26
+ "metadata": {},
27
+ "outputs": [
28
+ {
29
+ "data": {
30
+ "text/html": [
31
+ "<div>\n",
32
+ "<style scoped>\n",
33
+ " .dataframe tbody tr th:only-of-type {\n",
34
+ " vertical-align: middle;\n",
35
+ " }\n",
36
+ "\n",
37
+ " .dataframe tbody tr th {\n",
38
+ " vertical-align: top;\n",
39
+ " }\n",
40
+ "\n",
41
+ " .dataframe thead th {\n",
42
+ " text-align: right;\n",
43
+ " }\n",
44
+ "</style>\n",
45
+ "<table border=\"1\" class=\"dataframe\">\n",
46
+ " <thead>\n",
47
+ " <tr style=\"text-align: right;\">\n",
48
+ " <th></th>\n",
49
+ " <th>task_id</th>\n",
50
+ " <th>Question</th>\n",
51
+ " <th>Level</th>\n",
52
+ " <th>Final answer</th>\n",
53
+ " <th>file_name</th>\n",
54
+ " <th>Annotator Metadata</th>\n",
55
+ " </tr>\n",
56
+ " </thead>\n",
57
+ " <tbody>\n",
58
+ " <tr>\n",
59
+ " <th>0</th>\n",
60
+ " <td>c61d22de-5f6c-4958-a7f6-5e9707bd3466</td>\n",
61
+ " <td>A paper about AI regulation that was originall...</td>\n",
62
+ " <td>2</td>\n",
63
+ " <td>egalitarian</td>\n",
64
+ " <td></td>\n",
65
+ " <td>{'Steps': '1. Go to arxiv.org and navigate to ...</td>\n",
66
+ " </tr>\n",
67
+ " <tr>\n",
68
+ " <th>1</th>\n",
69
+ " <td>17b5a6a3-bc87-42e8-b0fb-6ab0781ef2cc</td>\n",
70
+ " <td>I’m researching species that became invasive a...</td>\n",
71
+ " <td>2</td>\n",
72
+ " <td>34689</td>\n",
73
+ " <td></td>\n",
74
+ " <td>{'Steps': '1. Search the web for “finding nemo...</td>\n",
75
+ " </tr>\n",
76
+ " <tr>\n",
77
+ " <th>2</th>\n",
78
+ " <td>04a04a9b-226c-43fd-b319-d5e89743676f</td>\n",
79
+ " <td>If we assume all articles published by Nature ...</td>\n",
80
+ " <td>2</td>\n",
81
+ " <td>41</td>\n",
82
+ " <td></td>\n",
83
+ " <td>{'Steps': '1. Find how many articles were publ...</td>\n",
84
+ " </tr>\n",
85
+ " <tr>\n",
86
+ " <th>3</th>\n",
87
+ " <td>14569e28-c88c-43e4-8c32-097d35b9a67d</td>\n",
88
+ " <td>In Unlambda, what exact charcter or text needs...</td>\n",
89
+ " <td>2</td>\n",
90
+ " <td>backtick</td>\n",
91
+ " <td></td>\n",
92
+ " <td>{'Steps': '1. Searched \"Unlambda syntax\" onlin...</td>\n",
93
+ " </tr>\n",
94
+ " <tr>\n",
95
+ " <th>4</th>\n",
96
+ " <td>e1fc63a2-da7a-432f-be78-7c4a95598703</td>\n",
97
+ " <td>If Eliud Kipchoge could maintain his record-ma...</td>\n",
98
+ " <td>1</td>\n",
99
+ " <td>17</td>\n",
100
+ " <td></td>\n",
101
+ " <td>{'Steps': '1. Googled Eliud Kipchoge marathon ...</td>\n",
102
+ " </tr>\n",
103
+ " </tbody>\n",
104
+ "</table>\n",
105
+ "</div>"
106
+ ],
107
+ "text/plain": [
108
+ " task_id \\\n",
109
+ "0 c61d22de-5f6c-4958-a7f6-5e9707bd3466 \n",
110
+ "1 17b5a6a3-bc87-42e8-b0fb-6ab0781ef2cc \n",
111
+ "2 04a04a9b-226c-43fd-b319-d5e89743676f \n",
112
+ "3 14569e28-c88c-43e4-8c32-097d35b9a67d \n",
113
+ "4 e1fc63a2-da7a-432f-be78-7c4a95598703 \n",
114
+ "\n",
115
+ " Question Level Final answer \\\n",
116
+ "0 A paper about AI regulation that was originall... 2 egalitarian \n",
117
+ "1 I’m researching species that became invasive a... 2 34689 \n",
118
+ "2 If we assume all articles published by Nature ... 2 41 \n",
119
+ "3 In Unlambda, what exact charcter or text needs... 2 backtick \n",
120
+ "4 If Eliud Kipchoge could maintain his record-ma... 1 17 \n",
121
+ "\n",
122
+ " file_name Annotator Metadata \n",
123
+ "0 {'Steps': '1. Go to arxiv.org and navigate to ... \n",
124
+ "1 {'Steps': '1. Search the web for “finding nemo... \n",
125
+ "2 {'Steps': '1. Find how many articles were publ... \n",
126
+ "3 {'Steps': '1. Searched \"Unlambda syntax\" onlin... \n",
127
+ "4 {'Steps': '1. Googled Eliud Kipchoge marathon ... "
128
+ ]
129
+ },
130
+ "execution_count": 5,
131
+ "metadata": {},
132
+ "output_type": "execute_result"
133
+ }
134
+ ],
135
+ "source": [
136
+ "# Convert the list of dictionaries to a DataFrame\n",
137
+ "df = pd.DataFrame(metadata)\n",
138
+ "df.head()"
139
+ ]
140
+ },
141
+ {
142
+ "cell_type": "code",
143
+ "execution_count": 54,
144
+ "id": "9b7659b2",
145
+ "metadata": {},
146
+ "outputs": [
147
+ {
148
+ "data": {
149
+ "text/plain": [
150
+ "{'Steps': '1. Search the web for “finding nemo main character”.\\n2. Note the results, which state that the main character is a clownfish.\\n3. Search the web for “usgs nonnative species database”.\\n4. Click result for the Nonindigenous Aquatic Species site.\\n5. Click “Marine Fishes”.\\n6. Click “Species List of Nonindigenous Marine Fish”.\\n7. Scroll through the list until I find the clown anenomefish, and click “Collection info”.\\n8. Note the place that a clown anenomefish was found, in Fred Howard Park at the Gulf of Mexico.\\n9. Search the web for “fred howard park florida zip code”.\\n10. Note the zip code, 34689. Since only one clownfish was found before the year 2020, this is the answer.',\n",
151
+ " 'Number of steps': '10',\n",
152
+ " 'How long did this take?': '5 minutes',\n",
153
+ " 'Tools': '1. Search engine\\n2. Web browser',\n",
154
+ " 'Number of tools': '2'}"
155
+ ]
156
+ },
157
+ "execution_count": 54,
158
+ "metadata": {},
159
+ "output_type": "execute_result"
160
+ }
161
+ ],
162
+ "source": [
163
+ "#convert metadata into dataframe and view the annotator column\n",
164
+ "df = pd.DataFrame(metadata)\n",
165
+ "df.head()\n",
166
+ "df['Annotator Metadata'][1]"
167
+ ]
168
+ },
169
+ {
170
+ "cell_type": "code",
171
+ "execution_count": null,
172
+ "id": "54bf634a",
173
+ "metadata": {},
174
+ "outputs": [],
175
+ "source": [
176
+ "# Extract all tools from Annotator Metadata\n",
177
+ "all_tools = []\n",
178
+ "for entry in metadata:\n",
179
+ " tools = entry['Annotator Metadata']['Tools'].split('\\n')\n",
180
+ " # Remove numbering and leading/trailing whitespace from each tool\n",
181
+ " tools = [t.split('. ')[-1].strip() for t in tools]\n",
182
+ " all_tools.extend(tools)\n",
183
+ "\n",
184
+ "# Count unique tools\n",
185
+ "tool_counts = pd.Series(all_tools).value_counts()\n",
186
+ "#print out the top 10 tools with counts greater than 5 as a DataFrame\n",
187
+ "tool_counts_df = tool_counts.reset_index()\n",
188
+ "tool_counts_df.columns = ['Tool', 'Count']\n",
189
+ "tool_counts_df = tool_counts_df.sort_values(by='Count', ascending=False)\n",
190
+ "# print out unique tool names\n",
191
+ "# Save the tool counts to a CSV file\n",
192
+ "tool_counts_df.to_csv('tool_counts.csv', index=False)"
193
+ ]
194
+ },
195
+ {
196
+ "cell_type": "code",
197
+ "execution_count": null,
198
+ "id": "1f0a65e7",
199
+ "metadata": {},
200
+ "outputs": [
201
+ {
202
+ "data": {
203
+ "text/plain": [
204
+ "['Web browser',\n",
205
+ " 'Search engine',\n",
206
+ " 'Calculator',\n",
207
+ " 'Image recognition tools',\n",
208
+ " 'search engine',\n",
209
+ " 'None',\n",
210
+ " 'web browser',\n",
211
+ " 'A search engine',\n",
212
+ " 'A web browser',\n",
213
+ " 'PDF viewer',\n",
214
+ " 'PDF access']"
215
+ ]
216
+ },
217
+ "execution_count": 37,
218
+ "metadata": {},
219
+ "output_type": "execute_result"
220
+ }
221
+ ],
222
+ "source": [
223
+ "tool_counts_df.Tool[tool_counts_df.Count > 5].values.tolist()"
224
+ ]
225
+ },
226
+ {
227
+ "cell_type": "code",
228
+ "execution_count": 48,
229
+ "id": "3674e568",
230
+ "metadata": {},
231
+ "outputs": [
232
+ {
233
+ "data": {
234
+ "text/plain": [
235
+ "True"
236
+ ]
237
+ },
238
+ "execution_count": 48,
239
+ "metadata": {},
240
+ "output_type": "execute_result"
241
+ }
242
+ ],
243
+ "source": [
244
+ "import os\n",
245
+ "import requests\n",
246
+ "import json\n",
247
+ "import base64\n",
248
+ " \n",
249
+ "import numpy as np\n",
250
+ "from smolagents import CodeAgent, HfApiModel, Tool\n",
251
+ "from langchain.agents import load_tools\n",
252
+ "\n",
253
+ "#load env variables\n",
254
+ "from dotenv import load_dotenv\n",
255
+ "load_dotenv()\n"
256
+ ]
257
+ },
258
+ {
259
+ "cell_type": "code",
260
+ "execution_count": 52,
261
+ "id": "00f79e78",
262
+ "metadata": {},
263
+ "outputs": [
264
+ {
265
+ "ename": "PydanticUserError",
266
+ "evalue": "Field 'name' defined on a base class was overridden by a non-annotated attribute. All field definitions, including overrides, require a type annotation.\n\nFor further information visit https://errors.pydantic.dev/2.11/u/model-field-overridden",
267
+ "output_type": "error",
268
+ "traceback": [
269
+ "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
270
+ "\u001b[1;31mPydanticUserError\u001b[0m Traceback (most recent call last)",
271
+ "Cell \u001b[1;32mIn[52], line 38\u001b[0m\n\u001b[0;32m 31\u001b[0m wikipedia_tool \u001b[38;5;241m=\u001b[39m Tool(\n\u001b[0;32m 32\u001b[0m name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mWikipedia\u001b[39m\u001b[38;5;124m\"\u001b[39m,\n\u001b[0;32m 33\u001b[0m description\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mSearch Wikipedia articles for information\u001b[39m\u001b[38;5;124m\"\u001b[39m,\n\u001b[0;32m 34\u001b[0m func\u001b[38;5;241m=\u001b[39mwikipedia\u001b[38;5;241m.\u001b[39mrun\n\u001b[0;32m 35\u001b[0m )\n\u001b[0;32m 37\u001b[0m \u001b[38;5;66;03m# Basic Calculator Tool (free)\u001b[39;00m\n\u001b[1;32m---> 38\u001b[0m \u001b[38;5;28;01mclass\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[38;5;21;01mCalculatorTool\u001b[39;00m(BaseTool):\n\u001b[0;32m 39\u001b[0m name \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mCalculator\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m 40\u001b[0m description \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mUseful for performing mathematical calculations\u001b[39m\u001b[38;5;124m\"\u001b[39m\n",
272
+ "File \u001b[1;32mc:\\Users\\mabel\\Anaconda3\\envs\\hf_agent\\lib\\site-packages\\pydantic\\_internal\\_model_construction.py:112\u001b[0m, in \u001b[0;36mModelMetaclass.__new__\u001b[1;34m(mcs, cls_name, bases, namespace, __pydantic_generic_metadata__, __pydantic_reset_parent_namespace__, _create_model_module, **kwargs)\u001b[0m\n\u001b[0;32m 110\u001b[0m config_wrapper \u001b[38;5;241m=\u001b[39m ConfigWrapper\u001b[38;5;241m.\u001b[39mfor_model(bases, namespace, kwargs)\n\u001b[0;32m 111\u001b[0m namespace[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmodel_config\u001b[39m\u001b[38;5;124m'\u001b[39m] \u001b[38;5;241m=\u001b[39m config_wrapper\u001b[38;5;241m.\u001b[39mconfig_dict\n\u001b[1;32m--> 112\u001b[0m private_attributes \u001b[38;5;241m=\u001b[39m \u001b[43minspect_namespace\u001b[49m\u001b[43m(\u001b[49m\n\u001b[0;32m 113\u001b[0m \u001b[43m \u001b[49m\u001b[43mnamespace\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mconfig_wrapper\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mignored_types\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mclass_vars\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mbase_field_names\u001b[49m\n\u001b[0;32m 114\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[0;32m 115\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m private_attributes \u001b[38;5;129;01mor\u001b[39;00m base_private_attributes:\n\u001b[0;32m 116\u001b[0m original_model_post_init \u001b[38;5;241m=\u001b[39m get_model_post_init(namespace, bases)\n",
273
+ "File \u001b[1;32mc:\\Users\\mabel\\Anaconda3\\envs\\hf_agent\\lib\\site-packages\\pydantic\\_internal\\_model_construction.py:449\u001b[0m, in \u001b[0;36minspect_namespace\u001b[1;34m(namespace, ignored_types, base_class_vars, base_class_fields)\u001b[0m\n\u001b[0;32m 447\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m var_name \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01min\u001b[39;00m raw_annotations:\n\u001b[0;32m 448\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m var_name \u001b[38;5;129;01min\u001b[39;00m base_class_fields:\n\u001b[1;32m--> 449\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m PydanticUserError(\n\u001b[0;32m 450\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mField \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mvar_name\u001b[38;5;132;01m!r}\u001b[39;00m\u001b[38;5;124m defined on a base class was overridden by a non-annotated attribute. \u001b[39m\u001b[38;5;124m'\u001b[39m\n\u001b[0;32m 451\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mAll field definitions, including overrides, require a type annotation.\u001b[39m\u001b[38;5;124m'\u001b[39m,\n\u001b[0;32m 452\u001b[0m code\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmodel-field-overridden\u001b[39m\u001b[38;5;124m'\u001b[39m,\n\u001b[0;32m 453\u001b[0m )\n\u001b[0;32m 454\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(value, FieldInfo):\n\u001b[0;32m 455\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m PydanticUserError(\n\u001b[0;32m 456\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mField \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mvar_name\u001b[38;5;132;01m!r}\u001b[39;00m\u001b[38;5;124m requires a type annotation\u001b[39m\u001b[38;5;124m'\u001b[39m, code\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmodel-field-missing-annotation\u001b[39m\u001b[38;5;124m'\u001b[39m\n\u001b[0;32m 457\u001b[0m )\n",
274
+ "\u001b[1;31mPydanticUserError\u001b[0m: Field 'name' defined on a base class was overridden by a non-annotated attribute. All field definitions, including overrides, require a type annotation.\n\nFor further information visit https://errors.pydantic.dev/2.11/u/model-field-overridden"
275
+ ]
276
+ }
277
+ ],
278
+ "source": [
279
+ "# build tools for the agent with the following functions: websearch,calculator,Image recognition tools, image viewer, pdf viewer, pdf accesser\n",
280
+ "# use langchain and other libraries to build the tools\n",
281
+ "\n",
282
+ "from smolagents import CodeAgent, HfApiModel, Tool\n",
283
+ "from langchain.agents import load_tools\n",
284
+ "from langchain.tools import Tool as LangchainTool\n",
285
+ "\n",
286
+ "# Import required libraries\n",
287
+ "from langchain.tools import DuckDuckGoSearchRun\n",
288
+ "from langchain.utilities import WikipediaAPIWrapper\n",
289
+ "from langchain.tools import BaseTool\n",
290
+ "from langchain.callbacks.manager import CallbackManagerForToolRun\n",
291
+ "from typing import Optional, Type\n",
292
+ "from langchain.tools import ShellTool\n",
293
+ "from PIL import Image\n",
294
+ "import pytesseract\n",
295
+ "import requests\n",
296
+ "from io import BytesIO\n",
297
+ "import fitz # PyMuPDF for PDF handling\n",
298
+ "\n",
299
+ "# Web Search Tool using DuckDuckGo (free)\n",
300
+ "search = DuckDuckGoSearchRun()\n",
301
+ "web_search_tool = Tool(\n",
302
+ " name=\"Web Search\",\n",
303
+ " description=\"Search the web for current information using DuckDuckGo\",\n",
304
+ " func=search.run\n",
305
+ ")\n",
306
+ "\n",
307
+ "# Wikipedia Tool (free)\n",
308
+ "wikipedia = WikipediaAPIWrapper()\n",
309
+ "wikipedia_tool = Tool(\n",
310
+ " name=\"Wikipedia\",\n",
311
+ " description=\"Search Wikipedia articles for information\",\n",
312
+ " func=wikipedia.run\n",
313
+ ")\n",
314
+ "\n",
315
+ "# Basic Calculator Tool (free)\n",
316
+ "class CalculatorTool(BaseTool):\n",
317
+ " name = \"Calculator\"\n",
318
+ " description = \"Useful for performing mathematical calculations\"\n",
319
+ " \n",
320
+ " def _run(self, query: str, run_manager: Optional[CallbackManagerForToolRun] = None) -> str:\n",
321
+ " client = wolframalpha.Client(WOLFRAM_ALPHA_APPID)\n",
322
+ " res = client.query(query)\n",
323
+ " return next(res.results).text\n",
324
+ "\n",
325
+ "# Image Recognition Tool (using local Tesseract OCR)\n",
326
+ "class ImageRecognitionTool(BaseTool):\n",
327
+ " name = \"Image Recognition\"\n",
328
+ " description = \"Analyze and extract text from images using OCR\"\n",
329
+ " \n",
330
+ " def _run(self, image_path: str, run_manager: Optional[CallbackManagerForToolRun] = None) -> str:\n",
331
+ " try:\n",
332
+ " img = Image.open(image_path)\n",
333
+ " text = pytesseract.image_to_string(img)\n",
334
+ " return text\n",
335
+ " except Exception as e:\n",
336
+ " return f\"Error processing image: {str(e)}\"\n",
337
+ "\n",
338
+ "# PDF Reader Tool\n",
339
+ "class PDFReaderTool(BaseTool):\n",
340
+ " name = \"PDF Reader\"\n",
341
+ " description = \"Read and extract text from PDF documents\"\n",
342
+ " \n",
343
+ " def _run(self, pdf_path: str, run_manager: Optional[CallbackManagerForToolRun] = None) -> str:\n",
344
+ " try:\n",
345
+ " doc = fitz.open(pdf_path)\n",
346
+ " text = \"\"\n",
347
+ " for page in doc:\n",
348
+ " text += page.get_text()\n",
349
+ " return text\n",
350
+ " except Exception as e:\n",
351
+ " return f\"Error reading PDF: {str(e)}\"\n",
352
+ "\n",
353
+ "\n",
354
+ "\n",
355
+ "# Test the agent (uncomment to run)\n",
356
+ "# response = agent.run(\"Calculate 234 * 789 and then search for information about the result\")\n"
357
+ ]
358
+ }
359
+ ],
360
+ "metadata": {
361
+ "kernelspec": {
362
+ "display_name": "hf_agent",
363
+ "language": "python",
364
+ "name": "python3"
365
+ },
366
+ "language_info": {
367
+ "codemirror_mode": {
368
+ "name": "ipython",
369
+ "version": 3
370
+ },
371
+ "file_extension": ".py",
372
+ "mimetype": "text/x-python",
373
+ "name": "python",
374
+ "nbconvert_exporter": "python",
375
+ "pygments_lexer": "ipython3",
376
+ "version": "3.10.17"
377
+ }
378
+ },
379
+ "nbformat": 4,
380
+ "nbformat_minor": 5
381
+ }