Spaces:

Yooshiii
/

CodeSense

Running

App Files Files Community

CodeSense / merge_server.py

Yooshiii

Update merge_server.py

772d13a verified 9 days ago

raw

history blame contribute delete

34.1 kB

	import os
	import pickle
	import torch
	import numpy as np
	import ast
	from flask import Flask, request, jsonify
	from transformers import AutoTokenizer, AutoModel

	# --- IMPORT ETHAN'S HYBRID ENGINE (Checker 1 & 2) ---
	from codesense.analyzer import analyze_code

	app = Flask(__name__)

	# --- CONFIG ---
	# The pickled classifier is expected to sit next to this file.
	MODEL_FILE = 'NEW_BRAIN_MLP.pk2'
	base_dir = os.path.dirname(os.path.abspath(__file__))
	model_path = os.path.join(base_dir, MODEL_FILE)

	print("⏳ Booting up CodeSense Triple-Checker System...")
	print("⏳ Loading Checker 1 & 2: AST Rule-Engine + CodeT5...")

	# --- LOAD YOUR SAFETY NET (Checker 3: CodeBERT + pk2) ---
	# Bind all three names up front so they always exist at module level, even
	# when loading fails part-way; `classifier is None` disables the safety net.
	tokenizer = None
	codebert = None
	classifier = None
	try:
	    print(f"📂 Loading Checker 3: CodeBERT Safety Net ({MODEL_FILE})...")
	    tokenizer = AutoTokenizer.from_pretrained("microsoft/codebert-base")
	    codebert = AutoModel.from_pretrained("microsoft/codebert-base")

	    # NOTE(security): pickle.load can execute arbitrary code contained in the
	    # file. Only ship a model file that comes from a trusted source.
	    with open(model_path, 'rb') as f:
	        classifier = pickle.load(f)
	    # The port in this message matches the app.run() call at the bottom of
	    # the file (it previously claimed port 5000).
	    print("✅ All 3 AI Brains Loaded! Server Ready on Port 7860.")
	except Exception as e:
	    # Best-effort: the server still starts and serves results from the
	    # primary engine only.
	    print(f"❌ WARNING: Could not load Safety Net. {e}")
	    classifier = None

	def get_vector(code):
	    """Embed a source-code string with the module-level CodeBERT model.

	    The text is tokenized (truncated to at most 512 tokens), run through
	    ``codebert`` without gradient tracking, and the last-layer hidden state
	    at token position 0 is returned as a flattened NumPy array.
	    """
	    encoded = tokenizer(
	        code,
	        return_tensors="pt",
	        truncation=True,
	        max_length=512,
	        padding=True,
	    )
	    with torch.no_grad():
	        model_out = codebert(**encoded)
	    first_token_state = model_out.last_hidden_state[:, 0, :]
	    return first_token_state.numpy().flatten()


	# --- YOUR MAGIC VARIABLE EXTRACTOR & AST LOOP COUNTER ---
	class CodeAnalyzer(ast.NodeVisitor):
	    """AST visitor that records a function signature and the loop nesting depth.

	    After ``visit(tree)``:

	    * ``func_name`` / ``args_string`` / ``first_arg`` describe the function
	      definition visited last (sync or async). When the tree has no function,
	      or that function takes no positional arguments, the placeholders
	      ``"optimized_function"`` / ``"data"`` are used.
	    * ``max_loop_depth`` is the deepest nesting of ``for`` / ``while`` /
	      ``async for`` statements encountered anywhere in the tree.
	    """

	    # Placeholder argument name used when no real argument is available.
	    _DEFAULT_ARG = "data"

	    def __init__(self):
	        self.max_loop_depth = 0
	        self.current_loop_depth = 0
	        self.func_name = "optimized_function"
	        self.args_string = self._DEFAULT_ARG
	        self.first_arg = self._DEFAULT_ARG

	    def visit_FunctionDef(self, node):
	        """Record the name and positional arguments of ``node``, then descend."""
	        self.func_name = node.name
	        arg_names = [arg.arg for arg in node.args.args]
	        if arg_names:
	            self.args_string = ", ".join(arg_names)
	            self.first_arg = arg_names[0]
	        else:
	            # Reset instead of keeping the arguments of a previously visited
	            # function, so the name and the argument list always belong together.
	            self.args_string = self._DEFAULT_ARG
	            self.first_arg = self._DEFAULT_ARG
	        self.generic_visit(node)

	    # ``async def`` nodes expose the same ``name`` / ``args`` fields.
	    visit_AsyncFunctionDef = visit_FunctionDef

	    def _visit_loop(self, node):
	        """Track nesting depth while walking the body of a loop node."""
	        self.current_loop_depth += 1
	        self.max_loop_depth = max(self.max_loop_depth, self.current_loop_depth)
	        try:
	            self.generic_visit(node)
	        finally:
	            # Always restore the depth so sibling loops are measured correctly.
	            self.current_loop_depth -= 1

	    # Every loop statement kind shares the same bookkeeping.
	    visit_For = _visit_loop
	    visit_While = _visit_loop
	    visit_AsyncFor = _visit_loop


	# --- API ROUTE ---
	# Patterns that mean the first engine is slightly confused
	_GENERIC_PATTERNS = (
	    "Unknown",
	    "Nested Iterative",
	    "Linear Iterative",
	    "Recursive (Linear)",
	    "Recursive (Exponential)",
	)

	# Pattern names from the primary engine that reuse another entry of the UI
	# dictionary (e.g. "Linear Search" vs "Linear Iterative" from different models).
	_PATTERN_ALIASES = {
	    "Linear Iterative": "Linear Search",
	    "Recursive (Exponential)": "Fibonacci Sequence",  # General fallback for exponential recursion
	}

	# ==========================================
	# 📚 YOUR FULL UI DICTIONARY
	# ==========================================
	# Built once at import time instead of on every request. The placeholders
	# [FUNC_NAME], [ARGS] and [FIRST_ARG] inside the code templates are filled in
	# per request by _fill_template().
	# NOTE(review): the code templates use a single space after each "\n" in this
	# copy of the file; confirm against the deployed file whether their original
	# indentation was collapsed. They are reproduced here unchanged.
	_COMPLEXITY_MAP = {
	    # --- SORTING ---
	    "Bubble Sort": {
	        "space": "O(1)",
	        "explanation": "⚠️ CRITICAL: Bubble Sort is inefficient (O(n^2)) for large datasets. Refactor to Quick Sort or Merge Sort (O(n log n)).",
	        "improvements": ["Added a 'swapped' flag to exit early if sorted.", "Shrink inner loop by 'i' each pass."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n n = len([FIRST_ARG])\n for i in range(n):\n swapped = False\n for j in range(0, n - i - 1):\n if [FIRST_ARG][j] > [FIRST_ARG][j + 1]:\n [FIRST_ARG][j], [FIRST_ARG][j + 1] = [FIRST_ARG][j + 1], [FIRST_ARG][j]\n swapped = True\n if not swapped: break\n return [FIRST_ARG]",
	        "recommended_name": "Quick Sort OR Merge Sort (O(n log n))",
	        "recommended_code": "# --- OPTION 1: QUICK SORT ---\nimport random\ndef [FUNC_NAME]_quicksort([ARGS]):\n if len([FIRST_ARG]) <= 1: return [FIRST_ARG]\n pivot = random.choice([FIRST_ARG])\n L = [x for x in [FIRST_ARG] if x < pivot]\n M = [x for x in [FIRST_ARG] if x == pivot]\n R = [x for x in [FIRST_ARG] if x > pivot]\n return [FUNC_NAME]_quicksort(L) + M + [FUNC_NAME]_quicksort(R)\n\n# --- OPTION 2: BUILT-IN SORT ---\ndef [FUNC_NAME]_timsort([ARGS]):\n return sorted([FIRST_ARG])"
	    },
	    "Insertion Sort": {
	        "space": "O(1)",
	        "explanation": "⚠️ WARNING: Insertion Sort is slow (O(n^2)) for large lists. It is okay for small inputs (<50 items), but consider Quick Sort for scalability.",
	        "improvements": ["Your logic is correct for small datasets, but fails to scale.", "For >50 items, pivot to a divide-and-conquer approach."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n for i in range(1, len([FIRST_ARG])):\n key = [FIRST_ARG][i]\n j = i - 1\n while j >= 0 and key < [FIRST_ARG][j]:\n [FIRST_ARG][j + 1] = [FIRST_ARG][j]\n j -= 1\n [FIRST_ARG][j + 1] = key\n return [FIRST_ARG]",
	        "recommended_name": "Quick Sort OR Merge Sort (O(n log n))",
	        "recommended_code": "# --- OPTION 1: QUICK SORT ---\ndef [FUNC_NAME]_quicksort([ARGS]):\n if len([FIRST_ARG]) <= 1: return [FIRST_ARG]\n pivot = [FIRST_ARG][len([FIRST_ARG]) // 2]\n return [FUNC_NAME]_quicksort([x for x in [FIRST_ARG] if x < pivot]) + \\\n [x for x in [FIRST_ARG] if x == pivot] + \\\n [FUNC_NAME]_quicksort([x for x in [FIRST_ARG] if x > pivot])"
	    },
	    "Hash Map Lookup": {
	        "space": "O(n)",
	        "explanation": "✅ GOOD: Uses a dictionary (Hash Map) for instant O(1) lookups instead of repeatedly searching through a list. This drops the time complexity from O(n^2) down to a highly efficient O(n).",
	        "improvements": ["You are correctly using a dictionary to map elements.", "This trades a small amount of memory O(n) for a massive speedup O(1) per lookup."],
	        "optimized_code": "def [FUNC_NAME]([ARGS], target):\n seen = {}\n for i, val in enumerate([FIRST_ARG]):\n needed = target - val\n if needed in seen:\n return [seen[needed], i]\n seen[val] = i\n return []"
	    },
	    "Selection Sort": {
	        "space": "O(1)",
	        "explanation": "⚠️ WARNING: Selection Sort is always O(n^2), even if the list is sorted. Switch to Insertion Sort (for small lists) or Merge Sort.",
	        "improvements": ["Avoid this algorithm entirely for production code.", "Replace with an algorithm that adapts to already-sorted data."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n for i in range(len([FIRST_ARG])):\n min_idx = i\n for j in range(i+1, len([FIRST_ARG])):\n if [FIRST_ARG][j] < [FIRST_ARG][min_idx]:\n min_idx = j\n [FIRST_ARG][i], [FIRST_ARG][min_idx] = [FIRST_ARG][min_idx], [FIRST_ARG][i]\n return [FIRST_ARG]",
	        "recommended_name": "Insertion Sort OR Merge Sort",
	        "recommended_code": "# --- OPTION 1: INSERTION SORT ---\ndef [FUNC_NAME]_insertion([ARGS]):\n for i in range(1, len([FIRST_ARG])):\n key = [FIRST_ARG][i]\n j = i - 1\n while j >= 0 and key < [FIRST_ARG][j]:\n [FIRST_ARG][j + 1] = [FIRST_ARG][j]\n j -= 1\n [FIRST_ARG][j + 1] = key\n return [FIRST_ARG]"
	    },
	    "Quick Sort": {
	        "space": "O(log n)",
	        "explanation": "✅ EXCELLENT: Quick Sort is a standard, efficient O(n log n) algorithm. Ensure you handle the worst-case pivot selection.",
	        "improvements": ["Ensure your pivot is chosen randomly instead of always picking the first or last element."],
	        "optimized_code": "import random\ndef [FUNC_NAME]([ARGS]):\n if len([FIRST_ARG]) <= 1: return [FIRST_ARG]\n pivot = random.choice([FIRST_ARG])\n left = [x for x in [FIRST_ARG] if x < pivot]\n middle = [x for x in [FIRST_ARG] if x == pivot]\n right = [x for x in [FIRST_ARG] if x > pivot]\n return [FUNC_NAME](left) + middle + [FUNC_NAME](right)"
	    },
	    "Merge Sort": {
	        "space": "O(n)",
	        "explanation": "✅ EXCELLENT: Merge Sort is stable and consistent O(n log n). Great for large datasets.",
	        "improvements": ["Your algorithm is optimal for time complexity.", "Be aware that Merge Sort uses O(n) extra memory."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n if len([FIRST_ARG]) > 1:\n mid = len([FIRST_ARG]) // 2\n L, R = [FIRST_ARG][:mid], [FIRST_ARG][mid:]\n [FUNC_NAME](L)\n [FUNC_NAME](R)\n i = j = k = 0\n while i < len(L) and j < len(R):\n if L[i] < R[j]:\n [FIRST_ARG][k] = L[i]\n i += 1\n else:\n [FIRST_ARG][k] = R[j]\n j += 1\n k += 1\n while i < len(L):\n [FIRST_ARG][k] = L[i]\n i, k = i + 1, k + 1\n while j < len(R):\n [FIRST_ARG][k] = R[j]\n j, k = j + 1, k + 1\n return [FIRST_ARG]"
	    },
	    "Heap Sort": {
	        "space": "O(1)",
	        "explanation": "✅ GOOD: Heap Sort is memory efficient (O(1) extra space) and fast (O(n log n)).",
	        "improvements": ["Use Python's built-in `heapq` library for C-level optimization."],
	        "optimized_code": "import heapq\ndef [FUNC_NAME]([ARGS]):\n heapq.heapify([FIRST_ARG])\n return [heapq.heappop([FIRST_ARG]) for _ in range(len([FIRST_ARG]))]"
	    },
	    "Counting Sort": {
	        "space": "O(n + k)",
	        "explanation": "✅ EFFICIENT: Very fast (O(n+k)) for integers with a small range. Not suitable for strings or large ranges.",
	        "improvements": ["Ensure your data strictly contains integers with a known maximum value."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n if not [FIRST_ARG]: return [FIRST_ARG]\n max_val = max([FIRST_ARG])\n count = [0] * (max_val + 1)\n for num in [FIRST_ARG]: count[num] += 1\n idx = 0\n for i in range(len(count)):\n while count[i] > 0:\n [FIRST_ARG][idx] = i\n idx += 1\n count[i] -= 1\n return [FIRST_ARG]"
	    },

	    # --- SEARCHING ---
	    "Linear Search": {
	        "space": "O(1)",
	        "explanation": "⚠️ INEFFICIENT: iterating through every item is O(n). If your data is sorted, switch to Binary Search (O(log n)) for a massive speedup.",
	        "improvements": ["Only checking items one by one requires O(n) time.", "If your data is sorted, use Binary Search."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n for i in range(len([FIRST_ARG])):\n if [FIRST_ARG][i] == target: return i # Target must be passed\n return -1",
	        "recommended_name": "Binary Search (O(log n))",
	        "recommended_code": "import bisect\ndef [FUNC_NAME]_binary([ARGS]):\n # Assuming [FIRST_ARG] is sorted\n idx = bisect.bisect_left([FIRST_ARG], target)\n if idx < len([FIRST_ARG]) and [FIRST_ARG][idx] == target:\n return idx\n return -1"
	    },
	    "Binary Search": {
	        "space": "O(1)",
	        "explanation": "✅ PERFECT: Binary Search is the gold standard (O(log n)) for sorted arrays.",
	        "improvements": ["Ensure your array is sorted first.", "You can manually write it with a while loop, or use Python's built in `bisect` library."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n # Manual implementation\n left, right = 0, len([FIRST_ARG]) - 1\n while left <= right:\n mid = (left + right) // 2\n if [FIRST_ARG][mid] == target: return mid\n elif [FIRST_ARG][mid] < target: left = mid + 1\n else: right = mid - 1\n return -1"
	    },
	    "Jump Search": {
	        "space": "O(1)",
	        "explanation": "✅ GOOD: Jump Search (O(√n)) is better than Linear Search, but Binary Search is still faster if random access is allowed.",
	        "improvements": ["If you are using standard lists, switch to Binary Search (O(log n))."],
	        "optimized_code": "import math\ndef [FUNC_NAME]([ARGS]):\n n = len([FIRST_ARG])\n step = int(math.sqrt(n))\n prev = 0\n while [FIRST_ARG][min(step, n)-1] < target:\n prev = step\n step += int(math.sqrt(n))\n if prev >= n: return -1\n while [FIRST_ARG][prev] < target:\n prev += 1\n if prev == min(step, n): return -1\n if [FIRST_ARG][prev] == target: return prev\n return -1",
	        "recommended_name": "Binary Search (O(log n))",
	        "recommended_code": "import bisect\ndef [FUNC_NAME]_binary([ARGS]):\n idx = bisect.bisect_left([FIRST_ARG], target)\n if idx < len([FIRST_ARG]) and [FIRST_ARG][idx] == target:\n return idx\n return -1"
	    },
	    "Nested Iterative": {
	        "space": "O(1)",
	        "explanation": "⚠️ WARNING: Nested loops usually indicate a 'brute force' O(n^2) time complexity. This scales poorly for large datasets and can often be optimized.",
	        "improvements": ["Check if the inner loop can be replaced with a Hash Map (dictionary) for O(1) lookups.", "If analyzing contiguous subarrays, switch to the Sliding Window technique (O(n))."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n n = len([FIRST_ARG])\n # If you MUST use nested loops, ensure the inner loop shrinks each pass (j = i + 1)\n for i in range(n):\n for j in range(i + 1, n):\n pass # Your logic here\n return [FIRST_ARG]",
	        "recommended_name": "Hash Map Lookup OR Sliding Window (O(n))",
	        "recommended_code": "# --- OPTION 1: HASH MAP (For finding pairs/duplicates) ---\ndef [FUNC_NAME]_hashmap([ARGS]):\n seen = set()\n for item in [FIRST_ARG]:\n if item in seen: return item\n seen.add(item)\n return [FIRST_ARG]\n\n# --- OPTION 2: SLIDING WINDOW (For subarrays) ---\ndef [FUNC_NAME]_window([ARGS], k=2):\n # Assumes [FIRST_ARG] is a list of numbers\n window_sum = sum([FIRST_ARG][:k])\n for i in range(len([FIRST_ARG]) - k):\n window_sum = window_sum - [FIRST_ARG][i] + [FIRST_ARG][i+k]\n return window_sum"
	    },
	    # --- RECURSION, DP, & MATH ---
	    "Fibonacci Sequence": {
	        "space": "O(n)",
	        "explanation": "⚠️ RECURSION ALERT: Simple recursive Fibonacci is O(2^n) (Exponential). Refactor to use Dynamic Programming (Memoization) or an Iterative Loop to make it O(n).",
	        "improvements": ["Recursion causes stack overflow risks."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n if [FIRST_ARG] <= 0: return 0\n if [FIRST_ARG] == 1: return 1\n return [FUNC_NAME]([FIRST_ARG]-1) + [FUNC_NAME]([FIRST_ARG]-2)",
	        "recommended_name": "Iterative OR Memoized Fibonacci (O(n))",
	        "recommended_code": "# --- OPTION 1: ITERATIVE (O(1) Space) ---\ndef [FUNC_NAME]_iterative([ARGS]):\n if [FIRST_ARG] <= 0: return 0\n if [FIRST_ARG] == 1: return 1\n a, b = 0, 1\n for _ in range(2, [FIRST_ARG] + 1):\n a, b = b, a + b\n return b\n\n# --- OPTION 2: MEMOIZATION (Caching) ---\nfrom functools import lru_cache\n@lru_cache(maxsize=None)\ndef [FUNC_NAME]_memoized([ARGS]):\n if [FIRST_ARG] <= 1: return [FIRST_ARG]\n return [FUNC_NAME]_memoized([FIRST_ARG]-1) + [FUNC_NAME]_memoized([FIRST_ARG]-2)"
	    },
	    "Memoization": {
	        "space": "O(n)",
	        "explanation": "✅ EFFICIENT: You successfully applied Memoization (Top-Down DP) to prevent redundant calculations.",
	        "improvements": ["Caching results prevents the O(2^n) exponential blow-up of standard recursion."],
	        "optimized_code": "memo = {}\ndef [FUNC_NAME]([ARGS]):\n if [FIRST_ARG] in memo: return memo[[FIRST_ARG]]\n if [FIRST_ARG] <= 1: return [FIRST_ARG]\n memo[[FIRST_ARG]] = [FUNC_NAME]([FIRST_ARG]-1) + [FUNC_NAME]([FIRST_ARG]-2)\n return memo[[FIRST_ARG]]"
	    },
	    "Tabulation": {
	        "space": "O(n)",
	        "explanation": "✅ EFFICIENT: You successfully applied Tabulation (Bottom-Up DP) to prevent recursion stack overflow limits.",
	        "improvements": ["Iteratively building the table is memory safe and prevents RecursionError."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n if [FIRST_ARG] <= 0: return 0\n dp = [0] * ([FIRST_ARG] + 1)\n dp[1] = 1\n for i in range(2, [FIRST_ARG] + 1):\n dp[i] = dp[i-1] + dp[i-2]\n return dp[[FIRST_ARG]]"
	    },
	    "Factorial (Recursive)": {
	        "space": "O(n)",
	        "explanation": "⚠️ STACK RISK: Recursive Factorial works, but large inputs will cause a `RecursionError`. Use an Iterative Loop for safety.",
	        "improvements": ["Use a `for` loop to accumulate the result instead of recursion.", "Better yet, use Python's built in `math.factorial()`."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n if [FIRST_ARG] == 1 or [FIRST_ARG] == 0: return 1\n return [FIRST_ARG] * [FUNC_NAME]([FIRST_ARG] - 1)",
	        "recommended_name": "Iterative Factorial (O(n))",
	        "recommended_code": "import math\ndef [FUNC_NAME]_safe([ARGS]):\n # Built-in math functions run in C and avoid RecursionErrors\n return math.factorial([FIRST_ARG])"
	    },
	    "Factorial (Iterative)": {
	        "space": "O(1)",
	        "explanation": "✅ GOOD: Iterative Factorial is safe and efficient (O(n)).",
	        "improvements": ["Your logic is solid, but you can achieve even faster execution using the built-in math module."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n result = 1\n for i in range(2, [FIRST_ARG] + 1):\n result *= i\n return result"
	    },
	    "Prime Check": {
	        "space": "O(1)",
	        "explanation": "✅ EFFICIENT: This O(√n) approach is much faster than checking all numbers up to N.",
	        "improvements": ["Ensure your loop stops at the square root of n.", "Handle edge cases for 1, 2, and 3 explicitly."],
	        "optimized_code": "import math\ndef [FUNC_NAME]([ARGS]):\n if [FIRST_ARG] <= 1: return False\n if [FIRST_ARG] in (2, 3): return True\n if [FIRST_ARG] % 2 == 0 or [FIRST_ARG] % 3 == 0: return False\n for i in range(5, int(math.sqrt([FIRST_ARG])) + 1, 6):\n if [FIRST_ARG] % i == 0 or [FIRST_ARG] % (i + 2) == 0: return False\n return True"
	    },
	    "GCD (Euclidean)": {
	        "space": "O(1)",
	        "explanation": "✅ PERFECT: Euclidean algorithm is the most efficient way to find GCD.",
	        "improvements": ["Use Python's built-in `math.gcd` for cleaner and slightly faster code."],
	        "optimized_code": "def [FUNC_NAME](a, b):\n while b:\n a, b = b, a % b\n return abs(a)"
	    },
	    "Palindrome Check": {
	        "space": "O(1)",
	        "explanation": "✅ GOOD: O(n) is the optimal complexity for checking palindromes.",
	        "improvements": ["In Python, slicing is often faster than setting up a while loop with two pointers."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n return str([FIRST_ARG]) == str([FIRST_ARG])[::-1]"
	    },
	    "Armstrong Number": {
	        "space": "O(log n)",
	        "explanation": "✅ GOOD: Analyzing digits is O(log n), which is optimal.",
	        "improvements": ["Convert the number to a string to easily iterate over the digits."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n digits = str([FIRST_ARG])\n power = len(digits)\n return [FIRST_ARG] == sum(int(d)**power for d in digits)"
	    },

	    # --- GRAPHS, POINTERS, & DATA STRUCTURES ---
	    "Dijkstra's Algorithm": {
	        "space": "O(V)",
	        "explanation": "✅ INDUSTRY STANDARD: Best for finding shortest paths in weighted graphs.",
	        "improvements": ["Ensure you are using a Priority Queue (`heapq`) to achieve O(E log V) time complexity."],
	        "optimized_code": "import heapq\ndef [FUNC_NAME](graph, start):\n distances = {node: float('inf') for node in graph}\n distances[start] = 0\n pq = [(0, start)]\n while pq:\n curr_dist, curr_node = heapq.heappop(pq)\n if curr_dist > distances[curr_node]: continue\n for neighbor, weight in graph[curr_node].items():\n dist = curr_dist + weight\n if dist < distances[neighbor]:\n distances[neighbor] = dist\n heapq.heappush(pq, (dist, neighbor))\n return distances"
	    },
	    "Heap-Based Algorithm": {
	        "space": "O(N)",
	        "explanation": "✅ GOOD: Ideal for dynamically finding the top K elements (smallest/largest), scheduling tasks, or building priority queues without sorting the whole list.",
	        "improvements": ["Always use Python's built-in `heapq` module instead of manually sorting arrays with `.sort()`.", "Use `heapq.heapify()` to build your initial heap in O(N) time instead of pushing items one-by-one."],
	        "optimized_code": "import heapq\n\ndef [FUNC_NAME](data, k):\n # O(N) time to build the heap in-place\n heapq.heapify(data)\n # Extract the k smallest elements efficiently\n result = [heapq.heappop(data) for _ in range(k)]\n return result"
	    },
	    "Breadth-First Search": {
	        "space": "O(V)",
	        "explanation": "✅ GOOD: Perfect for shortest paths in unweighted graphs or level-order traversal.",
	        "improvements": ["Always use `collections.deque` for the queue instead of a standard list."],
	        "optimized_code": "from collections import deque\ndef [FUNC_NAME](graph, start):\n visited = set([start])\n queue = deque([start])\n result = []\n while queue:\n node = queue.popleft()\n result.append(node)\n for neighbor in graph[node]:\n if neighbor not in visited:\n visited.add(neighbor)\n queue.append(neighbor)\n return result"
	    },
	    "BFS (Graph)": {
	        "space": "O(V)",
	        "explanation": "✅ GOOD: Perfect for shortest paths in unweighted graphs or level-order traversal.",
	        "improvements": ["Always use `collections.deque` for the queue instead of a standard list."],
	        "optimized_code": "from collections import deque\ndef [FUNC_NAME](graph, start):\n visited = set([start])\n queue = deque([start])\n result = []\n while queue:\n node = queue.popleft()\n result.append(node)\n for neighbor in graph[node]:\n if neighbor not in visited:\n visited.add(neighbor)\n queue.append(neighbor)\n return result"
	    },
	    "Depth-First Search": {
	        "space": "O(V)",
	        "explanation": "✅ GOOD: Standard for pathfinding puzzles, topological sorting, and cycle detection.",
	        "improvements": ["If recursion depth is a concern, switch to an iterative DFS using a stack."],
	        "optimized_code": "def [FUNC_NAME](graph, start, visited=None):\n if visited is None: visited = set()\n visited.add(start)\n # Process node here\n for neighbor in graph[start]:\n if neighbor not in visited:\n [FUNC_NAME](graph, neighbor, visited)\n return visited"
	    },
	    "DFS (Graph)": {
	        "space": "O(V)",
	        "explanation": "✅ GOOD: Standard for pathfinding puzzles, topological sorting, and cycle detection.",
	        "improvements": ["If recursion depth is a concern, switch to an iterative DFS using a stack."],
	        "optimized_code": "def [FUNC_NAME](graph, start, visited=None):\n if visited is None: visited = set()\n visited.add(start)\n # Process node here\n for neighbor in graph[start]:\n if neighbor not in visited:\n [FUNC_NAME](graph, neighbor, visited)\n return visited"
	    },
	    "Sliding Window": {
	        "space": "O(1)",
	        "explanation": "✅ EFFICIENT: Sliding window prevents duplicate work when analyzing subarrays.",
	        "improvements": ["Maintains a running sum/condition without needing nested O(n^2) loops."],
	        "optimized_code": "def [FUNC_NAME](arr, k):\n current_sum = 0\n left = 0\n for right in range(len(arr)):\n current_sum += arr[right]\n if right - left + 1 > k:\n current_sum -= arr[left]\n left += 1\n return current_sum"
	    },
	    "Two-Pointer Technique": {
	        "space": "O(1)",
	        "explanation": "✅ EFFICIENT: Two pointers walking towards each other saves incredible amounts of memory.",
	        "improvements": ["Much faster than nested O(n^2) loops when dealing with sorted arrays."],
	        "optimized_code": "def [FUNC_NAME](arr, target):\n left, right = 0, len(arr) - 1\n while left < right:\n s = arr[left] + arr[right]\n if s == target: return True\n elif s < target: left += 1\n else: right -= 1\n return False"
	    },
	    "Binary Search Tree": {
	        "space": "O(n)",
	        "explanation": "ℹ️ INFO: Operations are O(log n) on average, but can degrade to O(n) if the tree is unbalanced. Consider an AVL Tree or Red-Black Tree for guaranteed performance.",
	        "improvements": ["Consider just using the built-in `dict` or `set` which are highly optimized Hash Tables in Python."],
	        "optimized_code": "class Node:\n def __init__(self, key):\n self.left, self.right, self.val = None, None, key\n\ndef [FUNC_NAME](root, key):\n if root is None or root.val == key: return root\n if root.val < key: return [FUNC_NAME](root.right, key)\n return [FUNC_NAME](root.left, key)"
	    },
	    "Stack Operations": {
	        "space": "O(n)",
	        "explanation": "✅ OPTIMAL: Push/Pop operations are O(1).",
	        "improvements": ["Standard Python lists are perfect for stacks. Just ensure you only use `.append()` and `.pop()`."],
	        "optimized_code": "def [FUNC_NAME]():\n stack = []\n stack.append('item') # Push O(1)\n item = stack.pop() # Pop O(1)\n return item"
	    },
	    "Queue (List)": {
	        "space": "O(n)",
	        "explanation": "⚠️ WARNING: Using `list.pop(0)` in Python is O(n). Use `collections.deque` for true O(1) queue operations.",
	        "improvements": ["Import 'deque' from the collections module.", "Use 'popleft()' instead of 'pop(0)' to achieve O(1) constant time."],
	        "optimized_code": "def [FUNC_NAME]([ARGS]):\n # Using list.pop(0) causes O(n) memory shifts\n queue = list([FIRST_ARG])\n queue.append('new_item')\n item = queue.pop(0) \n return item",
	        "recommended_name": "Collections.deque (True O(1) Queue)",
	        "recommended_code": "from collections import deque\ndef [FUNC_NAME]_optimized([ARGS]):\n queue = deque([FIRST_ARG])\n queue.append('new_item')\n # queue.popleft() is now O(1) instead of O(n)\n item = queue.popleft()\n return queue"
	    },
	    "Linked List (Singly)": {
	        "space": "O(n)",
	        "explanation": "ℹ️ INFO: Insertions are O(1) if you have the pointer, but searching is O(n).",
	        "improvements": ["Linked lists are rarely used in standard Python because standard lists are dynamic arrays."],
	        "optimized_code": "class Node:\n def __init__(self, data):\n self.data = data\n self.next = None\n\nclass LinkedList:\n def __init__(self):\n self.head = None\n def print_list(self):\n temp = self.head\n while temp:\n print(temp.data)\n temp = temp.next"
	    },
	    "Linked List (Doubly)": {
	        "space": "O(n)",
	        "explanation": "✅ FLEXIBLE: Doubly Linked Lists allow bidirectional traversal, at the cost of slightly more memory.",
	        "improvements": ["Python's built-in `collections.deque` is actually a Doubly Linked List under the hood! Use it for max performance."],
	        "optimized_code": "from collections import deque\n# deque is an optimized doubly linked list\ndef [FUNC_NAME]():\n dll = deque(['a', 'b', 'c'])\n dll.append('d') # Add to right\n dll.appendleft('z') # Add to left\n return dll"
	    }
	}


	def _describe_loop_depth(depth):
	    """Translate the deepest loop nesting level into a time-complexity label."""
	    if depth == 0:
	        return "O(1) (No loops)"
	    if depth == 1:
	        return "O(n) (Linear)"
	    if depth == 2:
	        return "O(n^2) (Nested loops)"
	    return f"O(n^{depth}) (Deeply nested)"


	def _fill_template(template, analyzer):
	    """Replace the [FUNC_NAME], [ARGS] and [FIRST_ARG] placeholders in a code template."""
	    return (
	        template.replace("[FUNC_NAME]", analyzer.func_name)
	        .replace("[ARGS]", analyzer.args_string)
	        .replace("[FIRST_ARG]", analyzer.first_arg)
	    )


	@app.route('/predict', methods=['POST'])
	def predict():
	    """Analyze the submitted code and return the combined verdict as JSON.

	    Request: a JSON object with a non-empty string under ``"code"``.

	    Responses:
	        200 -- JSON with ``algorithm``, ``confidence``, ``dynamic_complexity``,
	               ``space_complexity``, ``explanation``, ``improvements``,
	               ``optimized_code``, ``recommended_name``, ``recommended_code``
	               and ``safety_net_used``.
	        400 -- the body is not a JSON object, or ``code`` is missing, empty
	               or not a string.
	        500 -- any exception raised during analysis; the exception text is
	               returned under ``"error"`` and the traceback is printed.
	    """
	    # silent=True yields None for a missing/invalid JSON body instead of
	    # raising, so every bad request gets the same JSON-shaped 400 answer.
	    data = request.get_json(silent=True)
	    if not isinstance(data, dict):
	        return jsonify({"error": "Request body must be a JSON object"}), 400
	    code = data.get('code', '')
	    if not code or not isinstance(code, str):
	        return jsonify({"error": "No code provided"}), 400

	    try:
	        # 1. Extract your variables & Count Loops
	        analyzer = CodeAnalyzer()
	        try:
	            analyzer.visit(ast.parse(code))
	            # --- CALCULATE TIME COMPLEXITY USING AST ---
	            dynamic_comp = _describe_loop_depth(analyzer.max_loop_depth)
	        except Exception:
	            # Best-effort: code that cannot be parsed still goes through the
	            # classifiers below; the analyzer keeps whatever it collected.
	            dynamic_comp = "Error parsing code structure"

	        # ==========================================
	        # 🛡️ THE TRIPLE-CHECKER LOGIC
	        # ==========================================

	        # Run Ethan's Engine
	        analysis_result = analyze_code(code)

	        algo = analysis_result.get("pattern", "Unknown")
	        ethan_summary = analysis_result.get("summary", "")
	        # Tolerate a missing or None "ml_insights" / "confidence" entry.
	        ml_insights = analysis_result.get("ml_insights") or {}
	        t5_raw_conf = ml_insights.get("confidence") or 0.0

	        final_conf = t5_raw_conf
	        safety_net_triggered = False

	        # If AST/CodeT5 is confused, trigger YOUR CodeBERT model!
	        primary_unsure = algo in _GENERIC_PATTERNS or t5_raw_conf < 0.90
	        if primary_unsure and classifier is not None:
	            print(f"⚠️ Primary engine unsure (Confidence: {t5_raw_conf:.2f}). Triggering CodeBERT Safety Net...")

	            try:
	                vector = get_vector(code)
	                bert_pred = classifier.predict([vector])[0]

	                try:
	                    bert_probs = classifier.predict_proba([vector])[0]
	                    bert_conf = float(max(bert_probs))
	                except Exception:
	                    # No usable probabilities from the classifier: fall back
	                    # to a fixed confidence that still passes the 0.80 gate.
	                    bert_conf = 0.85

	                if bert_conf >= 0.80:
	                    # str() turns a NumPy string label into a plain str for
	                    # the dictionary lookup and the JSON response.
	                    algo = str(bert_pred)
	                    final_conf = bert_conf
	                    safety_net_triggered = True
	                    print(f"🛡️ Safety Net Override Successful: {algo} ({bert_conf*100:.1f}%)")
	            except Exception as e:
	                # The safety net is optional; keep the primary engine's answer.
	                print(f"Safety Net Error: {e}")

	        # A falsy confidence (0.0 / missing) is reported as 100%.
	        # NOTE(review): presumably because a pure rule-engine match carries no
	        # ML score -- confirm this is intended.
	        conf_percentage = (final_conf * 100) if final_conf else 100.0

	        # 4. Fallback Data
	        default_data = {
	            "space": "O(N)",
	            "explanation": f"CodeSense Engine Analysis: {ethan_summary}",
	            "improvements": ["Analysis pending for this algorithm."],
	            "optimized_code": "# Recognized Pattern. Specific optimization currently unavailable."
	        }

	        # Handle matching names from different models; unknown names fall
	        # through to default_data.
	        algo_key = _PATTERN_ALIASES.get(algo, algo)
	        result_data = _COMPLEXITY_MAP.get(algo_key, default_data)

	        # --- YOUR MAGIC VARIABLE REPLACEMENT FOR BOTH CODES ---
	        opt_code = _fill_template(result_data.get("optimized_code", ""), analyzer)
	        # Entries without a recommendation yield empty strings for both fields.
	        rec_code = _fill_template(result_data.get("recommended_code", ""), analyzer)
	        rec_name = result_data.get("recommended_name", "")

	        # 5. Send EVERYTHING back to VS Code
	        return jsonify({
	            "algorithm": algo,
	            "confidence": f"{conf_percentage:.1f}%",
	            "dynamic_complexity": dynamic_comp,
	            "space_complexity": result_data.get("space", "O(N)"),
	            "explanation": result_data.get("explanation", ""),
	            "improvements": result_data.get("improvements", []),
	            "optimized_code": opt_code,
	            "recommended_name": rec_name,
	            "recommended_code": rec_code,
	            "safety_net_used": safety_net_triggered
	        })

	    except Exception as e:
	        import traceback
	        print(traceback.format_exc())
	        return jsonify({"error": str(e)}), 500

	if __name__ == "__main__":
	    # Script entry point: start Flask's built-in server, listening on every
	    # network interface at port 7860.
	    app.run(port=7860, host="0.0.0.0")