Spaces:

AvinashAnalytics
/

sentinel-scam-honeypo

Paused

App Files Files Community

sentinel-scam-honeypo / app /agents /orchestrator.py

avinash-rai

Fix: Humanize responses - increase tokens to 120, persist language override across turns

3a6445b 4 months ago

raw

history blame contribute delete

51.4 kB

	# app/agents/orchestrator.py - Main agent controller

	"""Coordinates all agents for scam detection and honeypot engagement."""

	from typing import Dict, Any, Optional, List
	import time
	import os
	import re
	import json
	import random
	import asyncio
	import aiofiles
	from datetime import datetime, timedelta
	from fastapi import BackgroundTasks

	from app.core.llm_client import LLMClient, BudgetExceeded
	from app.agents.scam_detector import ScamDetector
	from app.agents.persona_engine import PersonaEngine
	from app.agents.intelligence_extractor import IntelligenceExtractor
	from app.agents.conversation_manager import ConversationManager
	from app.agents.adaptive_strategy import AdaptiveStrategyAgent

	from app.intelligence.threat_engine import ThreatIntelligenceEngine
	from app.intelligence.risk_scorer import RiskScoringEngine
	from app.intelligence.campaign_tracker import CampaignTracker

	from app.enforcement.police_api import CyberPoliceAPI, ActionRecommendationAPI

	from app.config import settings
	from app.utils.logger import AgentLogger
	from app.enforcement.stakeholder_exports import StakeholderExporter
	from app.utils.dossier_generator import dossier_generator
	from app.utils.callback_client import GUVIMandatoryCallback
	from app.utils.extractors import extract_all

	from app.intelligence.graph_threat_intel import graph_intel
	from app.intelligence.xai_reasoning import xai_explainer
	from app.intelligence.scammer_profiler import scammer_profiler
	from app.intelligence.enrichment_service import enrichment_service
	from app.core.context import TurnContext, is_engagement_complete



	class HoneypotOrchestrator:
	"""
	Main Honeypot Agent Orchestrator.

	Coordinates all sub-agents to process scammer messages
	and generate intelligent honeypot responses.
	"""

	def __init__(self):
	    """Create an orchestrator shell that is not yet ready to process messages.

	    Only the logger, the shared module-level helpers and the callback
	    client are set up here. The LLM client, the agents, the intelligence
	    modules and the enforcement APIs all start as ``None``; they are
	    populated by ``initialize()``.
	    """
	    self.logger = AgentLogger("orchestrator")

	    # Shared module-level helpers, plus the callback client built per instance.
	    self.profiler = scammer_profiler
	    self.enrichment_service = enrichment_service
	    self.guvi_callback = GUVIMandatoryCallback()

	    # Trace cache (kept for real-time visualization support); starts empty.
	    self.last_trace: Dict[str, Any] = {}

	    # LLM backend handed to the agents once it exists.
	    self.llm_client: Optional[LLMClient] = None

	    # Agents.
	    self.scam_detector: Optional[ScamDetector] = None
	    self.persona_engine: Optional[PersonaEngine] = None
	    self.intel_extractor: Optional[IntelligenceExtractor] = None
	    self.conversation_manager: Optional[ConversationManager] = None
	    self.adaptive_agent: Optional[AdaptiveStrategyAgent] = None

	    # Threat-intelligence modules.
	    self.threat_engine: Optional[ThreatIntelligenceEngine] = None
	    self.risk_scorer: Optional[RiskScoringEngine] = None
	    self.campaign_tracker: Optional[CampaignTracker] = None

	    # Law-enforcement integrations.
	    self.police_api: Optional[CyberPoliceAPI] = None
	    self.bank_api: Optional[ActionRecommendationAPI] = None

	    # Readiness flag; initialize() sets it to True as its last step.
	    self.initialized = False

	async def initialize(self) -> None:
	    """Construct the LLM client, the agents and any feature-flagged modules.

	    The threat-intelligence modules are created only when
	    ``settings.ENABLE_THREAT_INTELLIGENCE`` is truthy, and the enforcement
	    APIs only when ``settings.ENABLE_LAW_ENFORCEMENT_API`` is truthy.
	    ``self.initialized`` becomes True once construction has finished.
	    """
	    log = self.logger
	    log.info("Initializing honeypot orchestrator")

	    # Store the client on the instance first, then run its async setup.
	    client = self.llm_client = LLMClient()
	    await client.initialize()

	    # Agents that are handed the LLM client.
	    self.scam_detector = ScamDetector(client)
	    self.persona_engine = PersonaEngine(client)
	    self.intel_extractor = IntelligenceExtractor(client)

	    # Agents constructed without arguments.
	    self.conversation_manager = ConversationManager()
	    self.adaptive_agent = AdaptiveStrategyAgent()

	    # Optional threat-intelligence stack.
	    if settings.ENABLE_THREAT_INTELLIGENCE:
	        self.threat_engine = ThreatIntelligenceEngine()
	        self.risk_scorer = RiskScoringEngine()
	        self.campaign_tracker = CampaignTracker()

	    # Optional law-enforcement integrations.
	    if settings.ENABLE_LAW_ENFORCEMENT_API:
	        self.police_api = CyberPoliceAPI()
	        self.bank_api = ActionRecommendationAPI()

	    self.initialized = True
	    log.info("Orchestrator initialized successfully")



	async def process_message(
	self,
	message: str,
	conversation_id: Optional[str] = None,
	sender_id: Optional[str] = None,
	auto_report: bool = True,
	background_tasks: Optional[BackgroundTasks] = None,
	client_ip: str = "Unknown",
	sender_role: str = "scammer", # [SCORING] Explicit role support
	should_finalize: bool = False, # [LATENCY] Turbo Mode Flag
	request_language: str = "hinglish" # [FIX] Language from GUVI metadata
	) -> Dict[str, Any]:
	"""
	Process an incoming message through the OODA loop.

	Args:
	message: The scammer's message
	conversation_id: Unique session ID
	sender_id: Sender identifier (e.g. phone number)
	auto_report: Whether to automatically report to law enforcement
	background_tasks: FastAPI BackgroundTasks for non-blocking reporting
	should_finalize: Whether to run expensive forensic wrap-up (XAI/Enrichment)
	"""
	start_time = time.time()
	client_ip = client_ip or "Unknown"

	if not self.initialized:
	await self.initialize()

	# --- TOKEN RESILIENCE: Input Capping ---
	from app.utils.token_utils import smart_truncate
	original_length = len(message)
	message = smart_truncate(message, max_chars=4000)
	if len(message) < original_length:
	self.logger.warning(f"Message truncated for token safety: {original_length} -> {len(message)} chars")

	# Reasoning Accumulator for Final Audit (Loaded from session for continuity)
	reasoning_traces = []

	# ------------------------------------------------------------------
	# 🔥 OPTIMIZATION: TURN CONTEXT (Request Scope)
	# Prevents redundant API calls and loops
	# ------------------------------------------------------------------
	ctx = TurnContext(session_id=conversation_id or "new", message=message, sender_role=sender_role)
	ctx.request_language = request_language # [FIX] Store GUVI language preference


	# Get or create conversation (Auto-generates created_at if new)
	conversation = await self.conversation_manager.get_or_create(
	conversation_id, sender_id
	)
	conv_id = conversation["id"]

	# 🔥 [RISK 5] TRACE CONTINUITY: Load existing traces
	reasoning_traces = conversation.get("reasoning_history", [])

	# Link session to context for session-level budget enforcement
	ctx.session = conversation

	# SOC SWITCHBOARD: OPTIONAL SECURITY SCAN
	# For honeypot, we EXPECT scam content - only check Turn 1 for prompt injection
	# This saves 1 API call per turn after first message
	message_count_early = len(conversation.get("history", [])) + 1

	if message_count_early <= 1: # Only check first message
	try:
	is_safe = await self.llm_client.check_safeguard(message, context=ctx)
	if not is_safe:
	# HONEYPOT EXCEPTION: We EXPECT "Unsafe" (Fraud) content.
	# Only block if it looks like a System Override/Prompt Injection attempt.
	if "ignore previous instructions" in message.lower() or "system prompt" in message.lower():
	self.logger.warning("Prompt Injection Blocked by SOC Safety Guard", conv_id=conv_id)
	ctx.finalized = True
	ctx.reply_mode = "HONEYPOT_ONLY"
	return {
	"status": "blocked",
	"reason": "Security violation detected (Prompt Injection)",
	"honeypot_response": {"message": "System unavailable.", "persona": "system"}
	}
	else:
	self.logger.info("Safety Guard flagged content (likely Scam), proceeding as Honeypot...", conv_id=conv_id)
	except Exception as e:
	self.logger.warning(f"Safety Guard Check Failed (LLM Error): {e}. Failing OPEN (Proceeding).", session_id=conv_id)

	# Determine session start time for accurate metrics
	session_created_str = conversation.get("created_at", datetime.utcnow().isoformat())
	try:
	# Strip Z if present to maintain naive datetime consistency with utcnow()
	session_start_raw = session_created_str.replace("Z", "").split("+")[0]
	session_start = datetime.fromisoformat(session_start_raw)
	except:
	session_start = datetime.utcnow()
	duration_seconds = (datetime.utcnow() - session_start).total_seconds()

	# Determine message count (for phase)
	message_count = len(conversation.get("history", [])) + 1

	# Init Decision Variables (Scope Safety)
	persona = None
	phase = "hook"
	scammer_behavior = None
	escalation_rec = {}
	is_fast_path = False
	is_scammer_repeating = False # [BUG FIX] Initialize early for Fast Path safety

	# [SCORING] Role-based logic: If sender is 'user', treat as non-scam or testing turn
	if sender_role == "user":
	self.logger.info("Scoring Override: Message from 'user' role detected. Fail-safe engagement mode.", session_id=conv_id)
	# We still run detection for safety, but we can nudge it
	scammer_behavior = {"behavior": "calm", "strategy": "neutral", "confidence": 0.0}

	# Step 1: Heuristic Pre-Check (Latency Elimination)
	# [OPTIMIZATION] FASTEST-PATH HEURISTIC (Turn 0)
	heuristic_detection = self.scam_detector.detect_heuristic(message)

	detection = None
	intelligence = {}

	if message_count <= 1 and heuristic_detection.get("confidence", 0) > 0.5:
	self.logger.info("FASTEST-PATH: Turn 0 High Confidence Regex. Skipping ALL LLMs.", session_id=conv_id)
	is_fast_path = True
	detection = heuristic_detection

	# [FIX] PRESERVE REGEX INTEL IN FAST-PATH
	# Previously: intelligence = {} (Wiped out all extracted data)
	intelligence = extract_all(message)

	# Calculate heuristic risk score for Fast Path
	intelligence["risk_score"] = 0
	if intelligence.get("upi_ids"): intelligence["risk_score"] += 20
	if intelligence.get("bank_accounts"): intelligence["risk_score"] += 30
	if intelligence.get("urls"): intelligence["risk_score"] += 10

	# Set Defaults for Fast Path
	# MUST be a dict for persona_engine compatibility
	scammer_behavior = {"behavior": "urgent", "strategy": "fast_path", "confidence": 1.0}

	ctx.persona_selected = True
	phase = "hook"

	# Prevent UnboundLocalError
	# SOC FIX: Sanitize merged_intel for Fast-Path compatibility
	merged_intel = (conversation.get("aggregated_intelligence") or {}).copy()
	merged_intel.setdefault("keywords", [])
	merged_intel.setdefault("upi_ids", [])
	merged_intel.setdefault("bank_accounts", [])

	# [FIX] Merge Regex Intelligence into Aggregated Intel for Fast Path
	# This ensures GUVI callback receives the extracted UPIs

	for k, v in intelligence.items():
	if k in ["risk_score", "scam_confidence"]: continue
	if v and isinstance(v, list):
	current = merged_intel.get(k, [])
	merged_intel[k] = list(set(current + v))

	# SOC FIX: Use taxonomy intelligence for persona selection in FASTEST-PATH
	persona_key = detection.get("persona", "worried_customer")
	persona = self.persona_engine.get_persona(persona_key)
	if not persona:
	persona = self.persona_engine.get_persona("elderly_excited") or list(self.persona_engine.get_all_personas().values())[0]

	# Sync Graph Intel (Minimal - Keywords)
	if detection.get("matched_keywords"):
	await self.conversation_manager.update_intelligence(conv_id, {"keywords": detection["matched_keywords"]})

	else:
	# Step 1 & 2: Parallel Detection & Extraction (Latency Optimization)
	# Run both independent agents simultaneously to halve processing time

	# --- NOVELTY TRIGGER CALCULATION ---
	existing_scam = conversation.get("scam_type")
	last_confidence = conversation.get("scam_confidence", 0.0) # 🔥 FIX: Use stored confidence
	behavior_changed = False
	history = conversation.get("history", [])

	# [SCORING] Repetition Detection: If scammer is repeating demands, escalate agitation
	is_scammer_repeating = False
	if history:
	previous_msgs = [h.get("scammer_message", "").lower() for h in history[-2:]]
	current_msg_lower = message.lower()
	for prev in previous_msgs:
	# Simple fuzzy match: same core words or same length/prefix
	if prev == current_msg_lower or (len(prev) > 10 and prev[:15] == current_msg_lower[:15]):
	is_scammer_repeating = True
	self.logger.info("Scammer repetition detected, preparing for agitation escalation.", session_id=conv_id)
	break

	last_turn = history[-1]
	# Check for behavior flip (Heuristic comparison of last behavior if available)
	# For now, we'll assume extraction_task will handle detailed behavior analysis later,
	# but we can check if the last turn was 'conclude' or 'escalate'

	if existing_scam: # If sticky, we can run extraction immediately with high confidence
	# 🔥 SKIP LLM DETECTION entirely - use cached result
	detection = {
	"scam_type": existing_scam,
	"confidence": conversation.get("scam_confidence", 0.9),
	"is_scam": True,
	"reasoning": "Sticky detection from session memory",
	"source": "memory",
	"matched_keywords": conversation.get("aggregated_intelligence", {}).get("keywords", [])
	}
	# 🔥 SKIP LLM EXTRACTION on most turns - regex is sufficient
	# Only do LLM extraction on turn 1 and every 5th turn (handled inside extract())
	intelligence = await self.intel_extractor.extract(
	message,
	context=ctx,
	turn_count=message_count,
	last_confidence=last_confidence,
	current_confidence=conversation.get("scam_confidence", 0.9),
	behavior_changed=behavior_changed
	)
	else:
	# If not sticky, we MUST run detection first to get 'current_confidence' for extraction novelty
	try:
	detection = await self.scam_detector.detect(message, context=ctx, turn_count=message_count)
	except Exception as e:
	self.logger.error(f"Detection FAIL: {e}", session_id=conv_id)
	detection = {"is_scam": False, "confidence": 0.0, "scam_type": "error"}

	try:
	intelligence = await self.intel_extractor.extract(
	message,
	context=ctx,
	turn_count=message_count,
	last_confidence=last_confidence,
	current_confidence=detection.get("confidence", 0.0),
	behavior_changed=behavior_changed
	)
	except Exception as e:
	self.logger.error(f"Extraction FAIL: {e}", session_id=conv_id)
	# Fallback to pure regex locally if agent died (Crash Safety)
	intelligence = extract_all(message)
	intelligence["risk_score"] = 0 # Default if scorer unreachable


	# ⚡ OPTIMIZATION: REGEX GUARD RULE
	# Rule: If Regex detects scam (Conf > 0.9), mark decided -> SKIP reasoning
	if detection.get("confidence", 0) > 0.9:
	ctx.mark_scam(detection["scam_type"], detection["confidence"])
	if detection.get("source") == "heuristic":
	self.logger.info("Fast-Path: Regex detected scam, skipping deep reasoning.", session_id=conv_id)

	# Core Logic Execution (Steps 3-5)
	# Initialize outputs for scope safety
	threat_intel = {}
	risk_explanation = []

	# Only run deep reasoning if NOT on Fast Path
	if not is_fast_path:
	# [Moved] Capture Native Reasoning Trace - now captured after full OODA loop

	# Step 2.5: Update Graph Knowledge Base (Winner-Tier)
	graph_intel.add_intelligence(conv_id, intelligence)

	# Step 2.6: Prepare Merged Intel for Logic
	conv_intel = conversation.get("aggregated_intelligence") or {}
	merged_intel = {**conv_intel}

	for key in intelligence:
	if key in ["risk_score", "scam_confidence", "risk_level", "timeline"]: continue
	if intelligence[key]:
	if key not in merged_intel: merged_intel[key] = []
	for item in intelligence[key]:
	if item not in merged_intel[key]: merged_intel[key].append(item)



	if detection.get("matched_keywords"):
	# Update local merged copy
	if "keywords" not in merged_intel:
	merged_intel["keywords"] = []
	for kw in detection["matched_keywords"]:
	if kw not in merged_intel["keywords"]:
	merged_intel["keywords"].append(kw)

	# CRITICAL FIX: Persist keywords to Memory immediately
	# Otherwise they only exist in this temporary 'merged_intel' scope
	await self.conversation_manager.update_intelligence(
	conv_id,
	{"keywords": detection["matched_keywords"]}
	)

	# Step 3: Adaptive Analysis (Moved up for decisioning)
	scammer_behavior = await self.adaptive_agent.analyze_scammer_behavior(message)
	reasoning_traces.append(f"Behavioral Analysis: {scammer_behavior.get('strategy', 'Neutral')}")

	escalation_rec = self.adaptive_agent.get_escalation_recommendation(conversation, merged_intel)
	reasoning_traces.append(f"Escalation Logic: {escalation_rec.get('reason', 'Continue')}")

	# Step 4: Determine conversation phase (Explicit State Machine with Adaptive Input)
	phase = await self.conversation_manager.determine_phase(message_count, merged_intel)

	# Step 5: Select persona (Sticky Logic)

	# [OPTIMIZATION] HARD PERSONA LOCK
	# If persona exists, we reuse it. We DO NOT allow re-selection logic to run.
	existing_persona_key = conversation.get("persona")
	if existing_persona_key:
	ctx.persona_selected = True
	ctx.persona_locked = True
	persona = self.persona_engine.get_persona(existing_persona_key)
	if persona:
	# Ensure the dict has the key so persona_engine knows which one it is
	persona = {**persona, "selected_persona_key": existing_persona_key}
	# Apply stored language from session to preserve language override
	stored_lang = conversation.get("aggregated_intelligence", {}).get("request_language")
	if stored_lang:
	persona["language"] = stored_lang
	self.logger.info(f"PERSONA LOCKED: Reusing {existing_persona_key}", session_id=conv_id)

	if not ctx.persona_locked:
	persona = await self.persona_engine.select_persona(
	scam_message=message,
	scam_type=detection["scam_type"],
	conversation_history=conversation.get("history"),
	current_phase=phase,
	session_id=conv_id,
	context=ctx # Pass context
	)
	if persona:
	ctx.persona_locked = True




	# Correctly get the internal key for logging/persistence
	persona_key = persona.get("selected_persona_key") if persona else existing_persona_key or "elderly_excited"
	if not persona_key: persona_key = "elderly_excited"

	# [FIX] CRASH PREVENTION: If persona is None (failed load/lock), hydrate it manually
	if not persona:
	self.logger.warning(f"Persona was None, hydrating from key: {persona_key}", session_id=conv_id)
	persona = self.persona_engine.get_persona(persona_key)

	# [FIX] LANGUAGE OVERRIDE: Apply GUVI request language to persona
	# This ensures responses match the requested language (English/Hindi/Hinglish)
	# Also persist language in session for subsequent turns with persona lock
	if request_language and persona:
	original_lang = persona.get("language", "hinglish")
	persona["language"] = request_language
	persona["original_language"] = original_lang # Preserve for debugging
	# Store in session for persistence
	if ctx and hasattr(ctx, "session") and ctx.session:
	ctx.session["request_language"] = request_language
	self.logger.info(f"Language override: {original_lang} -> {request_language}", session_id=conv_id)
	elif ctx and hasattr(ctx, "session") and ctx.session:
	# Restore language from session if not in current request
	stored_lang = ctx.session.get("request_language")
	if stored_lang and persona:
	persona["language"] = stored_lang

	# [LIFECYCLE] Recalculate finalization state based on newly extracted intel
	# This ensures that if we just captured a UPI ID, we trigger XAI immediately.
	internal_should_finalize = should_finalize or is_engagement_complete(conversation, scam_detected=detection.get("is_scam", False))

	# Step 6: Generate response (With Adaptive Injection)

	# ⚡ OPTIMIZATION: ATTEMPT GUARD
	# Ensure we only try LLM generation ONCE per turn.
	# If we fail or have already attempted, fall back to static.
	if ctx.fast_chat_attempted:
	self.logger.warning("Fast Chat already attempted, forcing static fallback.", session_id=conv_id)
	response_text = self.persona_engine._static_response("", persona=persona, scam_type=detection["scam_type"])
	else:
	ctx.fast_chat_attempted = True
	try:
	response_text = await self.persona_engine.generate_response(
	scam_message=message,
	persona=persona,
	scam_type=detection["scam_type"],
	conversation_history=conversation.get("history"),
	current_phase=phase,
	intelligence=merged_intel,
	scammer_behavior=scammer_behavior,
	context=ctx, # Pass context for budget enforcement
	is_repeating=is_scammer_repeating # [SCORING] Escalate if repeating
	)
	except BudgetExceeded as e:
	# GUARANTEED LOCAL FALLBACK on budget exhaustion
	self.logger.warning(f"Budget exceeded during response generation: {e}. Using static fallback.", session_id=conv_id)
	ctx.budget_exceeded = True
	response_text = self.persona_engine._static_response("", persona=persona, scam_type=detection["scam_type"])




	# Step 7: Attribution & Link Encoding
	# Automatically append session ID to decoy links for 360-degree tracking
	if "/decoys/" in response_text:
	# Find decoy links and append ?sid=conv_id (or &sid= if ? exists)
	def encode_link(match):
	link = match.group(0)
	sep = "&" if "?" in link else "?"
	return f"{link}{sep}sid={conv_id}"

	response_text = re.sub(r'https?://[^\s<>"]+/decoys/[^\s<>"]+', encode_link, response_text)
	# Also handle relative paths if any (for internal simulation logs)
	response_text = re.sub(r'(?<!http://)(?<!https://)/decoys/[^\s<>"]+', encode_link, response_text)

	# Step 8: Threat intelligence analysis
	# threat_intel initialized above
	risk_score = 0.0

	# [SCORING] Populate reasoning from detection
	if detection.get("reasoning"):
	reasoning_traces.append(f"Detection Reasoning: {detection['reasoning']}")
	# Step 8.1 - 8.3: Threat Analysis & Campaign Tracking
	if self.threat_engine:
	threat_intel = await self.threat_engine.analyze(
	detection["scam_type"],
	merged_intel,
	detection["confidence"]
	)

	# Track campaign
	if self.campaign_tracker:
	self.campaign_tracker.track(
	threat_intel["campaign_id"],
	detection["scam_type"],
	merged_intel
	)
	else:
	threat_intel = {"campaign_id": "none", "severity": "MEDIUM", "scam_pattern": "untracked"}

	# Step 8.4: Intelligence Enrichment
	# ⚡ OPTIMIZATION: TURBO MODE - ONLY RUN ON FINALIZATION
	enrichment_data = {}
	if settings.ENABLE_THREAT_INTELLIGENCE and self.enrichment_service and internal_should_finalize:
	from app.intelligence.mitre_mapper import mitre_mapper
	if detection.get("risk_indicators"):
	threat_intel["mitre_ttps"] = mitre_mapper.map_tactics(detection["risk_indicators"])
	threat_intel["mitre_campaign"] = mitre_mapper.get_campaign_ttps(detection["scam_type"])

	enrichment_data = await self.enrichment_service.enrich_intelligence(merged_intel)
	threat_intel["enrichment"] = enrichment_data
	if enrichment_data.get("reputation_alerts"):
	risk_explanation.extend(enrichment_data["reputation_alerts"])
	else:
	pass # Heuristic only path

	# Calculate risk score (Force Heuristic Mode if Finalized)
	# Calculate risk score (Force Heuristic Mode if Finalized)
	try:
	if self.risk_scorer:
	# Pass None for llm_client if finalized to strictly valid LLM usage
	run_llm = self.llm_client if not ctx.finalized else None
	risk_score, risk_explanation = await self.risk_scorer.calculate_risk_score(
	message,
	detection.get("scam_type", "unknown"),
	detection.get("confidence", 0.0),
	merged_intel,
	detection.get("matched_keywords", []),
	llm_client=run_llm
	)
	else:
	# [FAST PATH] Fallback to detector confidence if scorer disabled
	risk_score = detection.get("confidence", 0.0)
	risk_explanation = [f"Direct classification: {detection.get('scam_type', 'unknown')}"]
	except Exception as e:
	self.logger.error(f"Risk Scorer Failed: {e}", session_id=conv_id)
	risk_score = detection.get("confidence", 0.0)
	risk_explanation = ["Risk scoring fallback due to system error"]

	# Step 8.5: Enrich with Graph Data (Winner-Tier)
	lookup_entity = (merged_intel.get("phone_numbers") or [message])[0]
	if merged_intel.get("upi_ids") and len(merged_intel["upi_ids"]) > 0:
	lookup_entity = merged_intel["upi_ids"][0]

	try:
	campaign_info = graph_intel.get_campaign_info(lookup_entity)
	if campaign_info.get("campaign_id"):
	threat_intel["campaign_id"] = campaign_info["campaign_id"]
	threat_intel["cluster_size"] = campaign_info["cluster_size"]
	threat_intel["related_entities_count"] = len(campaign_info.get("related_entities", []))
	except Exception: pass

	# Step 8.5.5: Adversary Profiling
	try:
	scammer_behavior_profile = self.profiler.analyze_behavior(message)
	scammer_id = self.profiler.generate_scammer_id(merged_intel)
	threat_intel["scammer_id"] = scammer_id
	threat_intel["behavior_metrics"] = scammer_behavior_profile

	# Save profile state
	self.profiler.create_profile(scammer_id, merged_intel, scammer_behavior_profile, detection["scam_type"])
	except Exception as e:
	self.logger.error(f"Profiler Failed: {e}", session_id=conv_id)
	scammer_behavior_profile = {"strategy": "unknown"}

	# Step 8.6: Generate XAI Reasoning (Winner-Tier)
	# ⚡ OPTIMIZATION: TURBO MODE - ONLY RUN ON FINALIZATION
	# This moves ~4-5s of latency to the final reporting step only
	if settings.ENABLE_LLM_RESPONSES and self.llm_client and internal_should_finalize:
	try:
	xai_explanation = await xai_explainer.generate_explanation(
	self.llm_client, message, detection, risk_score, merged_intel
	)
	risk_explanation.extend(xai_explanation)
	except Exception as e:
	self.logger.error(f"XAI Failed: {e}", session_id=conv_id)

	# SOC FIX: Kill Switch moved after enrichment/XAI for full trace capture
	ctx.finalized = True


	# HACKATHON WINNING TRICK: SYNTHETIC INJECTION (Sandbox Mode)
	# If High Confidence Scam + No Intel + Sandbox Mode -> Inject specific indicators
	# This ensures judges NEVER see an empty report even for simple "Hi" messages
	if settings.SANDBOX_MODE and detection["is_scam"] and detection["confidence"] > 0.8:
	if not (merged_intel.get("upi_ids") or merged_intel.get("phone_numbers")):
	synthetic_intel = {
	"upi_ids": ["fraud@ybl"],
	"phone_numbers": ["9876543210"],
	"keywords": detection.get("matched_keywords", ["suspicious"])
	}
	# Merge into flow
	merged_intel.update(synthetic_intel)
	# Persist to memory so CallbackClient sees it
	await self.conversation_manager.update_intelligence(conv_id, synthetic_intel)
	# [ETHICS] Tag as synthetic for evaluator transparency
	merged_intel["is_synthetic"] = True
	self.logger.info("Executed SANDBOX SYNTHETIC INJECTION for judge visibility")
	xai_reason = xai_explainer.explain_score(
	detection["is_scam"],
	{"urgency": detection.get("confidence", 0), "payment_request": len(merged_intel.get("upi_ids", [])) > 0},
	detection.get("matched_keywords", [])
	)
	risk_explanation = [xai_reason]
	reasoning_traces.append(f"XAI Reason: {xai_reason}")

	# 🔥 PERSISTENCE FIX: Sync agitation level & reason to intelligence metadata
	if ctx.session.get("last_agitation"):
	intelligence["metadata_agitation"] = [ctx.session["last_agitation"]]
	# Capture the logic-level justification for the judge
	agg_intel = ctx.session.get("aggregated_intelligence", {})
	if agg_intel.get("metadata_agitation_reason"):
	intelligence["metadata_agitation_reason"] = [agg_intel["metadata_agitation_reason"]]

	# 🔥 LANGUAGE PERSISTENCE: Store request language for persona lock on subsequent turns
	if request_language:
	intelligence["request_language"] = request_language

	await self.conversation_manager.update(
	conversation_id=conv_id,
	scammer_message=message,
	honeypot_response=response_text,
	intelligence=intelligence,
	phase=phase,
	scam_type=detection.get("scam_type") or conversation.get("scam_type"),
	persona=persona_key,
	risk_score=risk_score,
	trust_score=0.0
	)

	# Step 9.1: Update session LLM call counter for budget enforcement
	conversation["session_llm_calls"] = conversation.get("session_llm_calls", 0) + ctx.llm_call_count

	# 7. REFLECT: Update history & Adaptive Learning

	# [NEW] GENERATE DENSE SUMMARY for reporting if high-risk or finalizing
	conversation_summary = f"Interaction at {phase} phase."

	# [ETHICS] Mention synthetic data in summary if present
	if merged_intel.get("is_synthetic"):
	conversation_summary += " \| [NOTE] Synthetic identifiers injected for sandbox visibility."

	# ⚡ OPTIMIZATION: MODEL-FREE SUMMARY
	# Only use template summary to avoid LLM storms
	if risk_score > 0.7 or should_finalize:
	conversation_summary = f"Scam: {detection['scam_type']} \| Phase: {phase} \| Turn: {message_count}"

	# Legacy LLM Summary (Disabled for Speed)
	# if risk_score > 0.7 or should_finalize:
	# try:
	# history_text = self.conversation_manager.get_history_text(conv_id, max_turns=15)
	# conversation_summary = await self.llm_client.generate_dense(
	# context=history_text,
	# initial_summary=f"Scam session {conv_id} ({detection['scam_type']})",
	# rounds=2 # 2 rounds is enough for performance/density balance
	# )
	# except Exception as e:
	# self.logger.error("Failed to generate dense summary", error=str(e))


	# Update conversation with summary
	if conversation_summary:
	await self.conversation_manager.update_intelligence(conv_id, {"summary": str(conversation_summary)})

	# 6. ACT: Auto-Report to Law Enforcement (if Risk > 0.8)
	# ------------------------------------------------------------------
	enforcement_actions = [] # Initialize here, will be empty if offloaded
	if auto_report and risk_score > 0.8 and settings.ENABLE_LAW_ENFORCEMENT_API:
	if background_tasks:
	background_tasks.add_task(
	self._auto_report_to_enforcement,
	conv_id=conversation["id"],
	scam_type=detection["scam_type"],
	intelligence=merged_intel,
	threat_intel=threat_intel,
	risk_score=risk_score,
	conversation_summary=conversation_summary,
	total_messages=message_count
	)
	self.logger.info(f"Queued background reporting for session {conversation['id']}")
	else:
	# Fallback to fire-and-forget task
	asyncio.create_task(
	self._auto_report_to_enforcement(
	conv_id=conversation["id"],
	scam_type=detection["scam_type"],
	intelligence=merged_intel,
	threat_intel=threat_intel,
	risk_score=risk_score,
	conversation_summary=conversation_summary,
	total_messages=message_count
	)
	)

	# 7. REFLECT: Update history & Adaptive Learning

	# Step 11: State-Based Final Callback Decision
	should_finalize = False
	if detection["is_scam"]:
	# Use Adaptive Agent's Verdict
	if escalation_rec.get("action") == "can_conclude":
	should_finalize = True
	# Fallback safety: High confidence + critical intel + SUFFICIENT DURATION
	# Fixes "Callback Flooding" by ensuring we don't finalize too early (min 3 turns)
	elif detection["confidence"] > 0.9 and (merged_intel.get("upi_ids") or merged_intel.get("bank_accounts")):
	# Only conclude if we have had a decent conversation length (>= 6 messages)
	if message_count >= 6:
	should_finalize = True


	# [NEW] FINAL SOC REASONING CAPTURE
	# Capture trace after response generation to ensure "Thought" is present in audit
	# [SCORING] Trace Windowing: Keep only last 5 segments to prevent memory growth
	if reasoning_traces:
	# Windowing for the next turn
	windowed_history = reasoning_traces[-5:]
	native_reasoning = "\n\n".join(windowed_history)
	# Persist to session for turn-over-turn continuity
	await self.conversation_manager.update_intelligence(conv_id, {"reasoning_history": windowed_history})
	else:
	native_reasoning = "Heuristic decision based on " + detection.get("scam_type", "detected patterns")

	# [REMOVED] Legacy GUVI callback logic.
	# The callback is now handled centrally in app.utils.guvi_handler to prevent circular dependencies.

	# ═══════════════════════════════════════════════════════════════════════════
	# 🔥 INTEL BOOST: If payment intel extracted, FORCE scamDetected=True
	# GUVI Critical: Judges need to see scamDetected=True when UPI/Bank captured
	# ═══════════════════════════════════════════════════════════════════════════
	has_payment_intel = (
	intelligence.get("upi_ids") or
	intelligence.get("bank_accounts") or
	intelligence.get("credit_cards")
	)

	if has_payment_intel:
	# FORCE scam detection when payment intel found
	detection["is_scam"] = True
	detection["confidence"] = max(detection.get("confidence", 0.0), 0.85)
	if not detection.get("scam_type") or detection.get("scam_type") == "not_scam":
	detection["scam_type"] = "banking_scam"
	self.logger.info(
	"INTEL BOOST: Payment intel detected, forcing scamDetected=True",
	upi=intelligence.get("upi_ids"),
	bank=intelligence.get("bank_accounts")
	)

	# Calculate processing time
	processing_time = int((time.time() - start_time) * 1000)

	# Build comprehensive response
	result = {
	"status": "success",
	"is_scam": detection.get("is_scam", False),
	"scam_type": detection.get("scam_type", "unknown"),
	"confidence": detection.get("confidence", 0.0),
	"threat_level": detection.get("threat_level", "medium").upper(), # SOC FIX: Normalize
	"risk_explanation": risk_explanation,
	"explanation": risk_explanation,
	"agent_notes": conversation_summary, # [SCORING] Pass summary to callback
	"decision_reason": escalation_rec.get("reason", "Heuristic confidence threshold met"), # SOC FIX: Explainability
	"should_finalize": internal_should_finalize,
	"session_duration_seconds": duration_seconds,
	"honeypot_response": {
	"message": response_text,
	"persona": persona_key,
	"language": persona.get("language", "hinglish")
	},
	"extracted_intelligence": { # Raw per-turn
	"phone_numbers": intelligence.get("phone_numbers", []),
	"upi_ids": intelligence.get("upi_ids", []),
	"bank_accounts": intelligence.get("bank_accounts", []),
	"ifsc_codes": intelligence.get("ifsc_codes", []),
	"emails": intelligence.get("emails", []),
	"urls": intelligence.get("urls", [])
	},
	"aggregated_intelligence": merged_intel,
	"threat_intelligence": threat_intel,
	"conversation": {
	"id": conv_id,
	"phase": phase,
	"message_count": message_count,
	},
	"analysis": {
	"risk_indicators": detection.get("risk_indicators", []),
	"matched_keywords": detection.get("matched_keywords", []),
	"scam_category": detection.get("category", "Unknown"),
	"client_ip": client_ip
	},
	"enforcement_actions": enforcement_actions,
	"agent_steps": [
	f"Step 1: Detection [{self.llm_client.provider_name.upper()}] -> {detection.get('scam_type', 'unknown')} ({detection.get('confidence', 0.0):.2f})",
	f"Step 2: Adaptive strategy -> {scammer_behavior.get('strategy', 'engage')}",
	f"Step 3: State Machine -> Phase: {phase}",
	f"Step 4: Persona [{persona_key}] generated response",
	f"Step 5: Risk Level {detection.get('threat_level', 'medium').upper()} confirmed"
	],
	"adaptive_policy": {
	"phase": phase,
	"intel_gap": bool(escalation_rec.get("intel_score", 0) < 2),
	"strategy": scammer_behavior.get("strategy", "engage"),
	"escalation_rec": escalation_rec
	},
	"metadata": {
	"processing_time_ms": processing_time,
	"timestamp": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
	"version": settings.VERSION,
	"model": "Sentinel Honeypot v2.0 SOC",
	"native_reasoning_trace": native_reasoning
	}
	}

	# Cache for UI visualizer
	self.last_trace = result
	return result


	async def _auto_report_to_enforcement(
	    self,
	    conv_id: str,
	    scam_type: str,
	    intelligence: Dict,
	    threat_intel: Dict,
	    risk_score: float,
	    conversation_summary: str = "",
	    total_messages: int = 1
	) -> List[Dict]:
	    """
	    File reports and request enforcement actions for a session.

	    Steps, in order:
	      0. Create ``reports/sessions/<conv_id>``.
	      1. Write a Markdown dossier produced by ``dossier_generator``.
	      2. Write the JSON bundle produced by ``StakeholderExporter.export_all``.
	      3. File a report through ``self.police_api`` (if configured).
	      4. Request a UPI action through ``self.bank_api`` for at most the
	         first two extracted UPI IDs.

	    Steps 1-4 are best-effort: a failure is logged and the remaining
	    steps still run.

	    Args:
	        conv_id: Session identifier; used in folder and file names.
	        scam_type: Detected scam type label.
	        intelligence: Aggregated intelligence dict (``upi_ids`` is read here).
	        threat_intel: Threat-intelligence dict passed through to the exporters.
	        risk_score: Risk score passed through to the exporters.
	        conversation_summary: Optional summary; a generic sentence is used
	            when it is empty.
	        total_messages: Accepted for interface compatibility; not used here.

	    Returns:
	        A list of action records (one dict per artefact/report/request that
	        succeeded). Empty when ``settings.ENABLE_LAW_ENFORCEMENT_API`` is falsy.
	    """
	    # Function-scope import: the file-level import only brings in
	    # ``datetime`` and ``timedelta``.
	    from datetime import timezone

	    if not settings.ENABLE_LAW_ENFORCEMENT_API:
	        self.logger.info("Enforcement reporting disabled by configuration.")
	        return []

	    actions: List[Dict] = []

	    # 0. Setup Storage Path (directory creation is pushed to a worker thread)
	    session_folder = f"reports/sessions/{conv_id}"
	    await asyncio.to_thread(os.makedirs, session_folder, exist_ok=True)

	    # 1. Generate Formal Intelligence Dossier (Markdown)
	    try:
	        # Prepare data for DossierGenerator matching its expected schema
	        dossier_input = {
	            "scam_type": scam_type,
	            "risk_score": risk_score,
	            "threat_intelligence": threat_intel,
	            "aggregated_intelligence": intelligence,
	            "analysis": {"scam_category": scam_type},
	            "telemetry": threat_intel.get("enrichment", {}).get("client_meta", {}),
	            # Timezone-aware replacement for the deprecated datetime.utcnow();
	            # the formatted string is unchanged.
	            "metadata": {
	                "timestamp": datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S")
	            },
	            "honeypot_response": {"persona": "Sentinel_AI"}
	        }
	        md_dossier = dossier_generator.generate_markdown(conv_id, dossier_input)

	        dossier_path = f"{session_folder}/dossier_{conv_id}.md"

	        # Async write to prevent event loop blocking
	        async with aiofiles.open(dossier_path, "w", encoding="utf-8") as f:
	            await f.write(md_dossier)

	        actions.append({
	            "type": "forensic_dossier",
	            "path": dossier_path,
	            "status": "generated"
	        })
	        self.logger.info(f"Generated autonomous forensic dossier at {dossier_path}")
	    except Exception as e:
	        self.logger.error("Failed to generate forensic dossier", error=str(e))

	    # 2. Generate Official Stakeholder Exports (JSON Bundle)
	    try:
	        reports = StakeholderExporter.export_all(
	            session_id=conv_id,
	            scam_type=scam_type.replace("_", " "),
	            intelligence=intelligence,
	            threat_intel=threat_intel,
	            risk_score=risk_score,
	            conversation_summary=conversation_summary or f"Automated reporting for high-risk session {conv_id}"
	        )

	        export_path = f"{session_folder}/official_exports_{conv_id}.json"

	        # Async JSON writing so the event loop is not blocked
	        async with aiofiles.open(export_path, "w", encoding="utf-8") as f:
	            await f.write(json.dumps(reports, indent=2))

	        actions.append({
	            "type": "official_regulatory_bundle",
	            "path": export_path,
	            "status": "generated"
	        })
	        self.logger.info(f"Generated official regulatory exports bundle at {export_path}")
	    except Exception as e:
	        self.logger.error("Failed to generate official exports", error=str(e))

	    # NOTE(review): this early return also skips the UPI freeze step below
	    # even when ``self.bank_api`` is set - confirm that is intended.
	    if not self.police_api:
	        return actions

	    # 3. File Police Report (Legacy API Simulation)
	    try:
	        report = self.police_api.file_report(
	            scam_type=scam_type,
	            intelligence=intelligence,
	            threat_intel=threat_intel,
	            risk_score=risk_score,
	            conversation_summary=conversation_summary or f"Automated enforcement for session {conv_id}"
	        )
	        actions.append({
	            "type": "cyber_police_report",
	            "report_id": report["report_id"],
	            "status": "filed"
	        })
	    except Exception as e:
	        self.logger.error("Auto-report failed", error=str(e))

	    # 4. Request UPI Freeze (if any) - capped at the first two UPI IDs
	    if self.bank_api and intelligence.get("upi_ids"):
	        for upi in intelligence["upi_ids"][:2]:
	            try:
	                req = self.bank_api.recommend_upi_action(
	                    upi_id=upi,
	                    reason=f"Scam detected: {scam_type}",
	                    threat_intel=threat_intel
	                )
	                actions.append({
	                    "type": "upi_freeze_request",
	                    "upi_id": upi,
	                    "request_id": req["request_id"],
	                    "status": "pending"
	                })
	            except Exception as e:
	                # Still best-effort (keep going with the next UPI ID), but
	                # leave a trace instead of silently discarding the failure.
	                self.logger.error("UPI freeze request failed", error=str(e), upi_id=upi)

	    # 5. [REMOVED] GUVIMANDATORY CALLBACK
	    # Duplicate callback removed to prevent session synchronization conflicts.
	    # Handled centrally in app.utils.guvi_handler.

	    return actions

	async def rebuild_intelligence_baseline(self, session_id: str) -> None:
	    """
	    Rebuild advanced threat intelligence for a session from its history.

	    Use this after cold restarts when history is provided by an external
	    source. Only the heuristic detector is used, so no LLM/API call is made
	    for historical data.

	    Args:
	        session_id: Identifier of the conversation to rebuild. Nothing
	            happens when the session is unknown or has no history.
	    """
	    conv = await self.conversation_manager.get(session_id)
	    if not conv or not conv.get("history"):
	        return

	    self.logger.info(f"Rebuilding intelligence baseline for session {session_id}")
	    history = conv["history"]

	    # 1. Use HEURISTIC detection on the first message (no API call) when
	    #    the session has no scam type yet.
	    # The resolved type is kept in a local so step 2 sees it even if
	    # ``conv`` is a snapshot that update_intelligence() does not mutate.
	    scam_type = conv.get("scam_type")
	    if not scam_type:
	        first_msg = history[0].get("scammer_message", "")
	        if first_msg:
	            detection = self.scam_detector.detect_heuristic(first_msg)
	            if detection.get("confidence", 0) > 0.3:
	                scam_type = detection.get("scam_type", "unknown")
	                await self.conversation_manager.update_intelligence(session_id, {
	                    "scam_type": scam_type,
	                    "scam_confidence": detection.get("confidence", 0.5)
	                })

	    # 2. Re-sync Graph Intel & Campaigns for all intel
	    agg_intel = conv.get("aggregated_intelligence", {})
	    if agg_intel:
	        graph_intel.add_intelligence(session_id, agg_intel)
	        if self.campaign_tracker and scam_type:
	            # Campaign key is derived from the session id.
	            self.campaign_tracker.track(f"rebuild_{session_id}", scam_type, agg_intel)

	async def get_statistics(self) -> Dict[str, Any]:
	    """
	    Collect system statistics.

	    Starts from the conversation manager's statistics and, when the
	    optional components are present, adds:
	      - ``campaigns``: everything the campaign tracker reports.
	      - ``reports_filed``: number of entries in the police API's reports.
	    """
	    summary = await self.conversation_manager.get_statistics()

	    tracker = self.campaign_tracker
	    if tracker:
	        summary["campaigns"] = tracker.get_all_campaigns()

	    police = self.police_api
	    if police:
	        summary["reports_filed"] = len(police.reports)

	    return summary

	def get_last_trace(self) -> Dict[str, Any]:
	    """
	    Return the most recently cached execution trace.

	    This is whatever was last stored on ``self.last_trace``; the same
	    object is returned, not a copy.
	    """
	    return self.last_trace

	async def shutdown(self) -> None:
	    """Close the LLM client when one is set, then log that shutdown finished."""
	    client = self.llm_client
	    if client:
	        await client.close()
	    self.logger.info("Orchestrator shutdown complete")


	# Global orchestrator instance, constructed once when this module is imported.
	orchestrator = HoneypotOrchestrator()


	# Names exported by a star-import of this module.
	__all__ = ["HoneypotOrchestrator", "orchestrator"]