Spaces:

layGkoder
/

mcphunter

Running

Anshul Ghate

Initial Commit

0e6b624 14 days ago

7.85 kB

	"""SHIELD Diagnostic Script — full state analysis of all 4 layers."""

	from __future__ import annotations

	import json
	import os
	import sys
	from pathlib import Path

	# Force UTF-8 output on Windows; characters that still cannot be encoded are
	# replaced instead of raising (errors="replace").
	if sys.platform == "win32":
	    sys.stdout.reconfigure(encoding="utf-8", errors="replace")  # type: ignore[attr-defined]

	# Ensure project root is on sys.path: the root is taken to be the directory
	# two levels above this file, and it is put first so that the ``mcphunter``
	# imports below are looked up there before any other location.
	project_root = Path(__file__).resolve().parent.parent
	sys.path.insert(0, str(project_root))

	from mcphunter.config import SEED_ATTACKS_PATH, SHIELD_CONFIG, ShieldConfig
	from mcphunter.shield.layer_heuristic import HeuristicLayer, _WEIGHTS
	from mcphunter.shield.layer_llm import LLMJudgeLayer
	from mcphunter.shield.models import Attack, Verdict
	from mcphunter.shield.pipeline import ShieldPipeline


	def load_seed_attacks() -> list[Attack]:
	    """Load the seed attacks stored at ``SEED_ATTACKS_PATH``.

	    The file is read as UTF-8 text, decoded as JSON, and every element of the
	    decoded value is converted with ``Attack.from_dict``.

	    Returns:
	        One ``Attack`` per element, in the iteration order of the decoded JSON.
	    """
	    data = json.loads(SEED_ATTACKS_PATH.read_text(encoding="utf-8"))
	    return [Attack.from_dict(a) for a in data]


	def section(title: str) -> None:
	    """Print a section banner to stdout.

	    The banner is a blank line, a 70-character ``=`` rule, the title prefixed
	    with one space, a second rule, and a trailing blank line.

	    Args:
	        title: Text shown between the two rules.
	    """
	    rule = "=" * 70
	    print(f"\n{rule}")
	    print(f" {title}")
	    print(f"{rule}\n")


	def _format_rate(hits: int, total: int) -> str:
	    """Format ``hits / total`` as a whole-number percentage.

	    Returns ``"n/a"`` when ``total`` is zero, so an empty seed file yields a
	    readable report instead of a ``ZeroDivisionError``.
	    """
	    return f"{hits / total:.0%}" if total else "n/a"


	def _escape_newlines(text: str, limit: int) -> str:
	    """Return the first ``limit`` characters of ``text`` with newlines shown as ``\\n``."""
	    # Done outside the f-string: a backslash inside an f-string replacement
	    # field is a SyntaxError on Python versions before 3.12.
	    return text[:limit].replace("\n", "\\n")


	def _report_evading(attacks: list[Attack]) -> tuple[ShieldPipeline, list[Attack]]:
	    """Step 1: scan every attack with the LLM layer disabled and list the evaders.

	    Returns:
	        The pipeline that was used (its ``stats`` are read again in step 5) and
	        the attacks whose verdict was ``Verdict.SAFE``.
	    """
	    section("1. EVADING ATTACKS (L1-L3 deterministic scan)")

	    # Use L1-L3 only pipeline for deterministic baseline
	    pipeline_l123 = ShieldPipeline(config=ShieldConfig(llm_layer_enabled=False))
	    evading = [a for a in attacks if pipeline_l123.scan(a.payload).verdict == Verdict.SAFE]

	    detected_l123 = len(attacks) - len(evading)
	    print(f"Detected by L1-L3: {detected_l123}/{len(attacks)} ({_format_rate(detected_l123, len(attacks))})")
	    print(f"Evading (SAFE): {len(evading)}/{len(attacks)}")
	    print()

	    for a in evading:
	        payload_preview = _escape_newlines(a.payload, 80)
	        print(f" {a.id:20s} | {a.attack_type.value:3s} | {payload_preview}...")

	    return pipeline_l123, evading


	def _report_heuristic_scores(evading: list[Attack]) -> None:
	    """Step 2: print the per-feature heuristic scores and weighted total per evader."""
	    section("2. HEURISTIC SCORES FOR EVADING ATTACKS")

	    heuristic = HeuristicLayer()

	    print(
	        f" {'ID':20s} | {'entropy':>7s} | {'hidden':>7s} | {'instr':>7s} | "
	        f"{'urls':>7s} | {'length':>7s} | {'auth':>7s} | {'TOTAL':>7s}"
	    )
	    # One 20-wide rule for the ID column followed by seven 7-wide rules.
	    print(" " + "-+-".join(["-" * 20] + ["-" * 7] * 7))

	    for a in evading:
	        scores = heuristic._compute_feature_scores(a.payload)
	        # TOTAL column: each feature score multiplied by its weight, summed.
	        ws = sum(scores[f] * _WEIGHTS[f] for f in _WEIGHTS)
	        print(
	            f" {a.id:20s} | {scores['entropy']:7.3f} | {scores['hidden_char_ratio']:7.3f} | "
	            f"{scores['instruction_density']:7.3f} | {scores['url_count']:7.3f} | "
	            f"{scores['length_anomaly']:7.3f} | {scores['authority_markers']:7.3f} | {ws:7.3f}"
	        )


	def _report_api_key() -> bool:
	    """Step 3: report whether ``GEMINI_API_KEY`` is set; return True when it is non-empty."""
	    section("3. GEMINI API KEY STATUS")

	    api_key = os.environ.get("GEMINI_API_KEY", "")
	    if not api_key:
	        print(" Key missing — set GEMINI_API_KEY environment variable")
	        return False

	    # NOTE(review): this echoes the first 8 characters of the secret to stdout;
	    # consider printing only the length if reports are shared.
	    print(f" Key found (length={len(api_key)}, starts with {api_key[:8]}...)")
	    return True


	def _report_llm_judge(evading: list[Attack], has_key: bool) -> None:
	    """Step 4: run the LLM judge layer alone on the first three evading attacks."""
	    section("4. LAYER 4 (LLM JUDGE) ON FIRST 3 EVADING ATTACKS")

	    if not has_key:
	        print(" SKIPPED — no API key available")
	        return
	    if not evading:
	        print(" SKIPPED — no evading attacks to test")
	        return

	    llm_layer = LLMJudgeLayer()
	    for a in evading[:3]:
	        print(f" Testing: {a.id} ({a.attack_type.value})")
	        print(f" Payload: {_escape_newlines(a.payload, 100)}...")
	        result = llm_layer.scan(a.payload)
	        if result:
	            print(f" Verdict: {result.verdict.value} (confidence={result.confidence:.2f})")
	            print(f" Explanation: {result.explanation}")
	        else:
	            # A falsy result is reported as "safe".
	            print(" Verdict: safe (LLM returned no detection)")
	        print()


	def _report_full_pipeline(
	    attacks: list[Attack],
	    pipeline_l123: ShieldPipeline,
	    detected_l123: int,
	    has_key: bool,
	) -> None:
	    """Step 5: scan every attack with ``SHIELD_CONFIG`` and summarise the results.

	    Without an API key the full scan is skipped and the L1-L3 figures from
	    step 1 are printed instead.
	    """
	    section("5. FULL 4-LAYER PIPELINE (ALL 50 SEED ATTACKS)")

	    if not has_key:
	        stats_l123 = pipeline_l123.stats
	        print(" SKIPPED — no API key; showing L1-L3 results only")
	        print(f" Detection rate (L1-L3): {detected_l123}/{len(attacks)} ({_format_rate(detected_l123, len(attacks))})")
	        print(f" Layer breakdown: L1={stats_l123.layer1_catches} L2={stats_l123.layer2_catches} L3={stats_l123.layer3_catches}")
	        return

	    pipeline_full = ShieldPipeline(config=SHIELD_CONFIG)
	    # attack type -> [number scanned, number detected]
	    by_type: dict[str, list[int]] = {}
	    newly_caught: list[tuple[Attack, str]] = []

	    for a in attacks:
	        result = pipeline_full.scan(a.payload)
	        counts = by_type.setdefault(a.attack_type.value, [0, 0])
	        counts[0] += 1
	        if result.verdict != Verdict.SAFE:
	            counts[1] += 1
	            # Only detections attributed to the LLM layer count as "newly caught".
	            if result.layer_triggered == "layer4_llm":
	                newly_caught.append((a, result.explanation))

	    total = sum(v[0] for v in by_type.values())
	    detected = sum(v[1] for v in by_type.values())

	    print(f" Overall detection rate: {detected}/{total} ({_format_rate(detected, total)})")
	    print()
	    print(" Layer breakdown:")
	    print(f" L1 (regex): {pipeline_full.stats.layer1_catches}")
	    print(f" L2 (encoding): {pipeline_full.stats.layer2_catches}")
	    print(f" L3 (heuristic): {pipeline_full.stats.layer3_catches}")
	    print(f" L4 (LLM): {pipeline_full.stats.layer4_catches}")
	    print(f" Safe (missed): {pipeline_full.stats.safe_count}")
	    print()

	    print(" Per-type breakdown:")
	    for t in sorted(by_type):
	        c, d = by_type[t]
	        status = "PERFECT" if d == c else f"{c - d} missed"
	        print(f" {t}: {d}/{c} ({status})")

	    if newly_caught:
	        print(f"\n Newly caught by Layer 4 ({len(newly_caught)} attacks):")
	        for a, explanation in newly_caught:
	            print(f" {a.id} ({a.attack_type.value}): {explanation[:100]}")


	def _report_configuration() -> None:
	    """Step 6: print the layer switches and LLM-judge settings from ``SHIELD_CONFIG``."""
	    section("6. PIPELINE CONFIGURATION")

	    config = SHIELD_CONFIG
	    print(f" Layer 1 (Regex): {'ENABLED' if config.regex_layer_enabled else 'DISABLED'}")
	    print(f" Layer 2 (Encoding): {'ENABLED' if config.encoding_layer_enabled else 'DISABLED'}")
	    print(f" Layer 3 (Heuristic): {'ENABLED' if config.heuristic_layer_enabled else 'DISABLED'}")
	    print(f" Layer 4 (LLM): {'ENABLED' if config.llm_layer_enabled else 'DISABLED'}")
	    print()
	    print(" Execution order: L1 -> L2 -> L3 -> L4 (short-circuit on first detection)")
	    print(f" L4 model: {config.llm_judge_config.model_name}")
	    print(f" L4 rate limit: {config.llm_judge_config.requests_per_day} RPD")
	    print(f" L4 retry attempts: {config.llm_judge_config.retry_max_attempts}")
	    print(f" L4 temperature: {config.llm_judge_config.temperature}")


	def main() -> None:
	    """Run the six diagnostic steps in order and print the report to stdout.

	    Steps: (1) attacks that evade layers 1-3, (2) their heuristic feature
	    scores, (3) Gemini API key status, (4) the LLM judge on the first three
	    evaders, (5) the full pipeline over all seed attacks, (6) the pipeline
	    configuration. Steps 4 and 5 are skipped or reduced when no API key is set.
	    """
	    attacks = load_seed_attacks()

	    # -----------------------------------------------------------------------
	    # Step 1 & 2: Find evading attacks and show heuristic scores
	    # -----------------------------------------------------------------------
	    pipeline_l123, evading = _report_evading(attacks)
	    _report_heuristic_scores(evading)

	    # -----------------------------------------------------------------------
	    # Step 3: API key check
	    # -----------------------------------------------------------------------
	    has_key = _report_api_key()

	    # -----------------------------------------------------------------------
	    # Step 4: Layer 4 alone on first 3 evading attacks
	    # -----------------------------------------------------------------------
	    _report_llm_judge(evading, has_key)

	    # -----------------------------------------------------------------------
	    # Step 5: Full 4-layer pipeline on all seed attacks
	    # -----------------------------------------------------------------------
	    _report_full_pipeline(attacks, pipeline_l123, len(attacks) - len(evading), has_key)

	    # -----------------------------------------------------------------------
	    # Step 6: Pipeline configuration
	    # -----------------------------------------------------------------------
	    _report_configuration()

	    print(f"\n{'='*70}")
	    print(" DIAGNOSTIC COMPLETE")
	    print(f"{'='*70}\n")


	# Run the diagnostic only when this file is executed as a script, not on import.
	if __name__ == "__main__":
	    main()