Final_Assignment_Template

Running

App Files Community

polyMoe committed 11 days ago

Commit

f8999dc

verified ·

1 Parent(s): 98d55d6

Update app.py

Browse files

implémentation des caches :
- cache des questions déjà récupérées
- cache des réponses déjà obtenues

Files changed (1) hide show

app.py +104 -27

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ import gradio as gr
 import requests
 import inspect
 import pandas as pd
 # (Keep Constants as is)
 # --- Constants ---
@@ -48,44 +49,120 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
     print(agent_code)
-    # 2. Fetch Questions
-    print(f"Fetching questions from: {questions_url}")
-    try:
-        response = requests.get(questions_url, timeout=15)
-        response.raise_for_status()
-        questions_data = response.json()
-        if not questions_data:
-             print("Fetched questions list is empty.")
-             return "Fetched questions list is empty or invalid format.", None
-        print(f"Fetched {len(questions_data)} questions.")
-    except requests.exceptions.RequestException as e:
-        print(f"Error fetching questions: {e}")
-        return f"Error fetching questions: {e}", None
-    except requests.exceptions.JSONDecodeError as e:
-         print(f"Error decoding JSON response from questions endpoint: {e}")
-         print(f"Response text: {response.text[:500]}")
-         return f"Error decoding server response for questions: {e}", None
-    except Exception as e:
-        print(f"An unexpected error occurred fetching questions: {e}")
-        return f"An unexpected error occurred fetching questions: {e}", None
-    # 3. Run your Agent
     results_log = []
     answers_payload = []
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue
         try:
-            submitted_answer = agent(question_text)
-            answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
-            results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
-        except Exception as e:
-             print(f"Error running agent on task {task_id}: {e}")
-             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
     if not answers_payload:
         print("Agent did not produce any answers to submit.")

 import requests
 import inspect
 import pandas as pd
+import json
 # (Keep Constants as is)
 # --- Constants ---
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
     print(agent_code)
+    # 2. Load Questions (cache first, API fallback)
+    cache_path = os.path.join(os.path.dirname(__file__), "cached_questions.json")
+    questions_data = None
+    # 2.a Try cache first
+    if os.path.exists(cache_path):
+        try:
+            with open(cache_path, "r", encoding="utf-8") as f:
+                cached = json.load(f)
+            if isinstance(cached, list) and cached:
+                questions_data = cached
+                print(f"Loaded {len(questions_data)} questions from cache: {cache_path}")
+            else:
+                print(f"Cache file found but empty/invalid format: {cache_path}")
+        except json.JSONDecodeError as e:
+            print(f"Cache JSON is invalid ({cache_path}): {e}. Falling back to API.")
+        except OSError as e:
+            print(f"Could not read cache file ({cache_path}): {e}. Falling back to API.")
+    # 2.b Fetch from API only if cache missing/invalid/empty
+    if questions_data is None:
+        print(f"Fetching questions from: {questions_url}")
+        try:
+            response = requests.get(questions_url, timeout=15)
+            response.raise_for_status()
+            questions_data = response.json()
+            if not isinstance(questions_data, list) or not questions_data:
+                print("Fetched questions list is empty or invalid format.")
+                return "Fetched questions list is empty or invalid format.", None
+            print(f"Fetched {len(questions_data)} questions from API.")
+            # Save cache for next runs
+            try:
+                with open(cache_path, "w", encoding="utf-8") as f:
+                    json.dump(questions_data, f, ensure_ascii=False, indent=2)
+                print(f"Questions cached to: {cache_path}")
+            except OSError as e:
+                print(f"Warning: unable to write cache file ({cache_path}): {e}")
+        except requests.exceptions.RequestException as e:
+            print(f"Error fetching questions: {e}")
+            return f"Error fetching questions: {e}", None
+        except requests.exceptions.JSONDecodeError as e:
+            print(f"Error decoding JSON response from questions endpoint: {e}")
+            print(f"Response text: {response.text[:500]}")
+            return f"Error decoding server response for questions: {e}", None
+        except Exception as e:
+            print(f"An unexpected error occurred fetching questions: {e}")
+            return f"An unexpected error occurred fetching questions: {e}", None
+    # 3. Run your Agent (answers cache by task_id)
     results_log = []
     answers_payload = []
+    answers_cache_path = os.path.join(os.path.dirname(__file__), "cached_answers.json")
+    answers_cache = {}
+    # 3.a Load answers cache
+    if os.path.exists(answers_cache_path):
+        try:
+            with open(answers_cache_path, "r", encoding="utf-8") as f:
+                loaded_cache = json.load(f)
+            if isinstance(loaded_cache, dict):
+                answers_cache = loaded_cache
+                print(f"Loaded {len(answers_cache)} cached answers from: {answers_cache_path}")
+            else:
+                print(f"Answers cache has invalid format (expected object): {answers_cache_path}")
+        except json.JSONDecodeError as e:
+            print(f"Answers cache JSON is invalid ({answers_cache_path}): {e}. Starting with empty cache.")
+        except OSError as e:
+            print(f"Could not read answers cache ({answers_cache_path}): {e}. Starting with empty cache.")
+    cache_updated = False
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue
+        task_key = str(task_id)
+        # Use cached answer if available
+        if task_key in answers_cache:
+            submitted_answer = answers_cache[task_key]
+            print(f"Using cached answer for task_id={task_id}")
+        else:
+            try:
+                submitted_answer = agent(question_text)
+                answers_cache[task_key] = submitted_answer
+                cache_updated = True
+                print(f"Computed and cached answer for task_id={task_id}")
+            except Exception as e:
+                print(f"Error running agent on task {task_id}: {e}")
+                results_log.append(
+                    {"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
+                continue
+        answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
+        results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
+    # 3.b Save answers cache only if updated
+    if cache_updated:
         try:
+            with open(answers_cache_path, "w", encoding="utf-8") as f:
+                json.dump(answers_cache, f, ensure_ascii=False, indent=2)
+            print(f"Answers cache updated: {answers_cache_path}")
+        except OSError as e:
+            print(f"Warning: unable to write answers cache ({answers_cache_path}): {e}")
     if not answers_payload:
         print("Agent did not produce any answers to submit.")