Upload folder using huggingface_hub

960ec3d verified 2 months ago

50 kB

	# Spam Email Classifier with XAI Explanations
	# ENGT 375 Project - Spring 2026 - ODU
	# Uses LIME, SHAP, ELI5, and Ollama/Qwen 3.5 (2b) for explanations

	import os
	import streamlit as st
	import numpy as np
	import pandas as pd
	import joblib
	import re
	import json
	import requests
	import shutil
	import matplotlib.pyplot as plt
	import matplotlib.colors as mcolors
	import shap
	import lime
	import lime.lime_tabular
	import eli5
	from pathlib import Path
	# I use sparse matrices here because TF-IDF creates a huge matrix and
	# converting to dense would use way too much memory (found this on Stack Overflow)
	from scipy.sparse import hstack, csr_matrix
	from utils_student import (preprocess_text, compute_metadata_features,
	spam_context_phrases, ham_context_phrases,
	registration_phrases, url_shorteners,
	legitimate_platforms, OLLAMA_API, LLM_FEATURE_NAMES)

	# Project directories
	# Both paths are resolved relative to this file rather than the working directory
	PROJECT_DIR = Path(__file__).parent
	MODELS_DIR = PROJECT_DIR / 'models'

	# Trusted domain whitelist (app-specific, not shared)
	# Entries are domain suffixes that check_domain_trust() compares against the sender's domain
	trusted_domains = {'.gov', '.mil', '.edu', 'govdelivery.com', 'granicus.com'}

	# I used JavaScript here because Streamlit doesn't save settings between sessions
	# by default - streamlit_js_eval lets me store the classification results in the
	# browser's localStorage so they persist when the page refreshes
	from streamlit_js_eval import streamlit_js_eval

	# localStorage key under which the serialized app state is saved, loaded and cleared
	STORAGE_KEY = "spam_xai_state"


	def _make_serializable(obj):
	"""Convert numpy arrays and other non-JSON types to serializable forms."""
	if isinstance(obj, np.ndarray):
	return obj.tolist()
	if isinstance(obj, np.integer):
	return int(obj)
	if isinstance(obj, np.floating):
	return float(obj)
	if isinstance(obj, dict):
	return {k: _make_serializable(v) for k, v in obj.items()}
	if isinstance(obj, (list, tuple)):
	return [_make_serializable(item) for item in obj]
	return obj


	def save_to_local_storage(data: dict):
	    """Write *data* to the browser's localStorage under STORAGE_KEY.

	    The dict is first made JSON-safe with _make_serializable, dumped to a
	    JSON string, and embedded in a JavaScript snippet that
	    streamlit_js_eval evaluates.
	    """
	    payload = json.dumps(_make_serializable(data))
	    # The component key is derived from the payload's hash, so a different
	    # payload produces a different component key.
	    component_key = "save_%d" % hash(payload)
	    script = "localStorage.setItem('%s', JSON.stringify(%s))" % (STORAGE_KEY, payload)
	    streamlit_js_eval(js_expressions=script, key=component_key)


	def load_from_local_storage():
	    """Load the saved app state from the browser's localStorage.

	    Returns:
	        The decoded state as a dict, or None when the component returned
	        nothing, the stored text is not valid JSON, or it decodes to
	        something other than a dict.
	    """
	    raw = streamlit_js_eval(
	        js_expressions="localStorage.getItem('%s')" % STORAGE_KEY,
	        key="load_state"
	    )
	    if not raw:
	        return None
	    try:
	        state = json.loads(raw)
	    except (TypeError, ValueError):
	        # json.JSONDecodeError is a ValueError; TypeError covers a value
	        # that is not str/bytes.
	        return None
	    # The restore code calls .get() on the result, so only a real dict is
	    # handed back; any other JSON value is treated as "nothing stored".
	    return state if isinstance(state, dict) else None


	def clear_local_storage():
	    """Delete the entry stored under STORAGE_KEY from the browser's localStorage."""
	    removal_script = "localStorage.removeItem('%s')" % STORAGE_KEY
	    streamlit_js_eval(js_expressions=removal_script, key="clear_state")


	def save_feedback(email_text, predicted_label, correct_label, spam_prob, notes, feedback_type):
	    """Append one feedback record to the CSV log and return the record count.

	    The log lives at ``data/feedback/feedback_log.csv`` next to this file;
	    the directory is created on demand and a header row is written when
	    the file is new or empty.

	    Args:
	        email_text: Email text; only the first 2000 characters are stored.
	        predicted_label: Label the classifier produced.
	        correct_label: Label the user says is correct.
	        spam_prob: Spam probability, stored with four decimal places.
	        notes: Free-form user notes.
	        feedback_type: Kind of feedback being recorded.

	    Returns:
	        Number of feedback records in the log after this write (the header
	        row is not counted).
	    """
	    import csv
	    import datetime

	    feedback_dir = Path(__file__).parent / 'data' / 'feedback'
	    feedback_dir.mkdir(parents=True, exist_ok=True)
	    feedback_file = feedback_dir / 'feedback_log.csv'
	    needs_header = not feedback_file.exists() or feedback_file.stat().st_size == 0
	    with open(feedback_file, 'a', newline='', encoding='utf-8') as f:
	        writer = csv.writer(f)
	        if needs_header:
	            writer.writerow(['timestamp', 'email_text', 'predicted_label', 'correct_label',
	                             'spam_prob', 'user_notes', 'feedback_type'])
	        writer.writerow([
	            datetime.datetime.now().isoformat(),
	            email_text[:2000], predicted_label, correct_label,
	            '%.4f' % spam_prob, notes, feedback_type
	        ])
	    # Count parsed CSV records, not physical lines: email text and notes
	    # can contain newlines, so one record may span several lines. The
	    # `with` block also closes the handle that was previously leaked.
	    with open(feedback_file, newline='', encoding='utf-8') as f:
	        row_count = sum(1 for _ in csv.reader(f)) - 1
	    return row_count


	def extract_llm_features_single(text, model_name='qwen3.5:2b'):
	    """Ask the Ollama chat endpoint to rate one email's intent and tone.

	    Only the first 500 characters of ``text`` are sent. The reply is
	    expected to contain a flat JSON object with six ratings.

	    Args:
	        text: Email text to rate.
	        model_name: Ollama model name to query.

	    Returns:
	        A (1, 6) float array ordered promotional, transactional, personal,
	        phishing, urgency, formality. A rating missing from the reply
	        defaults to 0.5; on a non-200 response, a reply without JSON, or
	        any exception the whole row is 0.5.
	    """
	    dimensions = ('promotional', 'transactional', 'personal',
	                  'phishing', 'urgency', 'formality')
	    snippet = text[:500]
	    template = (
	        'Rate this email on these dimensions (0.0 to 1.0).\n'
	        'Respond with ONLY valid JSON: {"promotional": X, "transactional": X, '
	        '"personal": X, "phishing": X, "urgency": X, "formality": X}\n'
	        '/no_think\n\n'
	        'Email: "%s"'
	    )
	    request_body = {
	        'model': model_name,
	        'messages': [{'role': 'user', 'content': template % snippet}],
	        'stream': False,
	        'think': False,
	        'options': {'temperature': 0.1, 'num_predict': 100}
	    }
	    try:
	        resp = requests.post(OLLAMA_API, json=request_body, timeout=30)
	        if resp.status_code == 200:
	            reply = resp.json().get('message', {}).get('content', '')
	            # Drop any <think>...</think> section before looking for the JSON object
	            reply = re.sub(r'<think>.*?</think>', '', reply, flags=re.DOTALL).strip()
	            found = re.search(r'\{[^}]+\}', reply)
	            if found:
	                scores = json.loads(found.group())
	                row = [float(scores.get(dim, 0.5)) for dim in dimensions]
	                return np.array(row).reshape(1, -1)
	    except Exception:
	        # Best effort: every failure falls through to the neutral row below
	        pass
	    return np.full((1, 6), 0.5)


	def _deserialize_results(data):
	"""Convert lists back to numpy arrays for results dict."""
	if data is None:
	return None
	for key in ('proba', 'original_proba', 'sv', 'meta'):
	if key in data and isinstance(data[key], list):
	data[key] = np.array(data[key])
	if 'top_idx' in data and isinstance(data['top_idx'], list):
	data['top_idx'] = np.array(data['top_idx'], dtype=int)
	return data

	# Example emails for testing
	# Maps the sidebar button label to the email text loaded into the input box
	# when that button is clicked. Labels are prefixed "Spam:" or "Ham:".
	EXAMPLE_EMAILS = {
	    "Spam: Nigerian Prince": """Subject: URGENT - You Have Won $5,000,000!!!

	Dear Friend,

	CONGRATULATIONS!!! You have been selected as the winner of our international lottery program!!!
	To claim your $5,000,000 USD prize, click the link below IMMEDIATELY and provide your bank details.

	ACT NOW - This offer expires in 24 hours!!!

	Click here: http://totally-legit-prize.com/claim
	Send $500 processing fee to unlock your winnings.

	Best regards,
	Dr. Prince Mohammed""",
	    "Spam: Viagra Ad": """Subject: Best prices on V1AGRA and C1ALIS!!!

	$$$ SAVE BIG $$$
	Buy now and get 80% OFF!!!
	No prescription needed! Free shipping!
	Order at http://cheap-pharma-deals.com

	LIMITED TIME OFFER - ACT NOW!
	Subscribe to our mailing list for more deals!""",
	    "Ham: Meeting Invite": """Subject: Team sync Thursday 2pm

	Hi everyone,

	Just a reminder that we have our weekly team sync this Thursday at 2pm in Conference Room B.

	Agenda:
	- Sprint review
	- Q2 planning discussion
	- New hire onboarding update

	Please come prepared with your status updates. If you can't make it, let me know and I'll share the notes.

	Thanks,
	Sarah""",
	    "Ham: Tech Discussion": """Subject: Re: Python 3.12 upgrade

	Hey Mike,

	I tested the upgrade on our staging environment yesterday. Everything looks good except for one
	deprecation warning in the logging module. I've already submitted a PR to fix it.

	The new pattern matching syntax is really nice for our parser module. Want to pair on refactoring
	that section next week?

	Also, did you see the new asyncio improvements? Could simplify our event loop code significantly.

	Cheers,
	Dave""",
	    "Ham: Family Email": """Subject: Thanksgiving dinner plans

	Hi everyone!

	Hope you're all doing well. I wanted to start planning for Thanksgiving dinner this year.

	Mom and Dad said they can host again. I was thinking we could do a potluck style - I'll bring
	the turkey and stuffing, and everyone else can sign up for sides and desserts.

	Can everyone reply with what they'd like to bring? Also let me know if you have any dietary
	restrictions I should know about.

	Love,
	Jenny"""
	}


	# Check if the sender domain is in our trusted list (.gov, .edu, etc.)
	# I added this because government and university emails were getting flagged as spam
	def check_domain_trust(email_text, trusted=None):
	    """Decide whether the email's sender domain is on the trusted list.

	    The domain is taken from the first address on a From:/Return-Path:/
	    Sender: line; if no such line has an address, the first email address
	    anywhere in the text is used instead.

	    Args:
	        email_text: Raw email text, with or without headers.
	        trusted: Optional iterable of trusted domain suffixes (with or
	            without a leading dot). Defaults to the module-level
	            ``trusted_domains`` set.

	    Returns:
	        A dict with ``trusted`` (bool), ``domain`` (lower-cased domain, or
	        None when no address was found) and ``match`` (the suffix that
	        matched, or None).
	    """
	    suffixes = trusted_domains if trusted is None else trusted

	    # Extract email addresses from From: headers or general text.
	    # The alternation uses a plain "|"; an escaped "\|" would only match a
	    # literal pipe character and the header branch would never fire.
	    from_match = re.search(
	        r'(?:From|Return-Path|Sender):\s*.*?([a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,})',
	        email_text, re.IGNORECASE)
	    if from_match:
	        domain = from_match.group(1).split('@')[-1].lower()
	    else:
	        # Fallback: any email address in the text
	        email_match = re.search(r'[a-zA-Z0-9._%+-]+@([a-zA-Z0-9.-]+\.[a-zA-Z]{2,})', email_text)
	        if not email_match:
	            return {'trusted': False, 'domain': None, 'match': None}
	        domain = email_match.group(1).lower()

	    for t in suffixes:
	        bare = t.lstrip('.')
	        # Match only on a label boundary: "mail.govdelivery.com" is trusted,
	        # "evilgovdelivery.com" is not.
	        if domain == bare or domain.endswith('.' + bare):
	            return {'trusted': True, 'domain': domain, 'match': t}

	    return {'trusted': False, 'domain': domain, 'match': None}


	# Detect email header signals for post-classification adjustment
	# I learned about these email headers from reading about how Gmail filters work
	def extract_header_features(text):
	    """Extract boolean header signals from raw email text.

	    Args:
	        text: Full email text including headers.

	    Returns:
	        A dict of booleans: ``has_list_unsubscribe``, ``sender_is_gov``
	        (sender domain ends in .gov or .mil), ``has_spf_pass`` and
	        ``has_dkim_pass``.
	    """
	    features = {}

	    # List-Unsubscribe header - legitimate newsletters include this so users
	    # can unsubscribe (spammers usually don't bother adding it)
	    features['has_list_unsubscribe'] = bool(re.search(r'List-Unsubscribe:', text, re.IGNORECASE))

	    # Sender domain checks. The alternation uses a plain "|"; an escaped
	    # "\|" would only match a literal pipe, leaving sender_domain empty.
	    from_match = re.search(
	        r'(?:From|Return-Path|Sender):\s*.*?@([a-zA-Z0-9.-]+\.[a-zA-Z]{2,})',
	        text, re.IGNORECASE)
	    sender_domain = from_match.group(1).lower() if from_match else ''
	    features['sender_is_gov'] = sender_domain.endswith(('.gov', '.mil'))

	    # Authentication results
	    features['has_spf_pass'] = bool(re.search(r'spf=pass', text, re.IGNORECASE))
	    features['has_dkim_pass'] = bool(re.search(r'dkim=pass', text, re.IGNORECASE))

	    return features


	# Load the trained model and supporting files
	# I load all the XAI libraries and model files here at startup - caching them with
	# @st.cache_resource means they stay in memory so every classification is fast
	@st.cache_resource
	def load_model():
	    """Load the classifier and its companion artifacts from MODELS_DIR.

	    The model, vectorizer and feature names are loaded unconditionally.
	    The remaining artifacts are optional and fall back to a default when
	    their file does not exist.

	    Returns:
	        Tuple ``(model, vectorizer, feature_names, training_sample, raw_rf,
	        optimal_threshold, training_config, meta_scaler)``. Fallbacks:
	        ``training_sample`` None, ``raw_rf`` the main model,
	        ``optimal_threshold`` 0.60, ``training_config``
	        ``{'llm_features_used': False}``, ``meta_scaler`` None.
	    """
	    def _load_or(filename, fallback):
	        # Load an optional artifact, or hand back the fallback if it is absent
	        artifact_path = MODELS_DIR / filename
	        return joblib.load(artifact_path) if artifact_path.exists() else fallback

	    print('Loading the trained model...')
	    model = joblib.load(MODELS_DIR / 'random_forest_spam.joblib')
	    vectorizer = joblib.load(MODELS_DIR / 'tfidf_vectorizer.joblib')
	    feature_names = joblib.load(MODELS_DIR / 'feature_names.joblib')
	    training_sample = _load_or('training_sample.joblib', None)
	    # I need the raw RF model separately because SHAP and ELI5 can't work
	    # with the calibrated wrapper - they need to see the actual tree structure
	    raw_rf = _load_or('random_forest_raw.joblib', model)
	    optimal_threshold = _load_or('optimal_threshold.joblib', 0.60)
	    # Training config tracks whether LLM features were used
	    training_config = _load_or('training_config.joblib', {'llm_features_used': False})
	    meta_scaler = _load_or('meta_scaler.joblib', None)
	    print('Done!')
	    return (model, vectorizer, feature_names, training_sample, raw_rf,
	            optimal_threshold, training_config, meta_scaler)


	# Cache LIME explainer so it's not recreated on every classification
	@st.cache_resource
	def get_lime_explainer(_training_data, feature_names):
	    """Build the LIME tabular explainer for the Ham/Spam classifier.

	    Args:
	        _training_data: Sample of training rows LIME uses as its reference
	            distribution. The leading underscore is Streamlit's convention
	            for leaving an argument out of the cache key.
	        feature_names: Names of the feature columns.

	    Returns:
	        A ``LimeTabularExplainer`` in classification mode.
	    """
	    # LIME needs a sample of training data to understand what "normal" looks like
	    # so it can measure how much each word changes the prediction
	    print('Creating LIME explainer (cached)...')
	    explainer_cls = lime.lime_tabular.LimeTabularExplainer
	    explainer = explainer_cls(
	        training_data=_training_data,
	        feature_names=feature_names,
	        class_names=['Ham', 'Spam'],
	        mode='classification'
	    )
	    return explainer


	# Cache SHAP explainer so it's not recreated on every classification
	@st.cache_resource
	def get_shap_explainer(_raw_rf):
	    """Build the SHAP TreeExplainer for the given tree model.

	    Args:
	        _raw_rf: Tree-based model to explain (the caller passes the
	            uncalibrated random forest).

	    Returns:
	        A ``shap.TreeExplainer`` wrapping ``_raw_rf``.
	    """
	    # I use TreeExplainer because it's designed specifically for tree-based models
	    # like Random Forest - it's much faster than the generic KernelExplainer
	    print('Creating SHAP TreeExplainer (cached)...')
	    tree_explainer = shap.TreeExplainer(_raw_rf)
	    return tree_explainer


	def check_ollama():
	    """Return the usable Ollama models, most preferred family first.

	    Queries the local Ollama tags endpoint and returns the installed model
	    names from the first family with a match, tried in the order
	    qwen3.5:2b, qwen3.5, gemma3.

	    Returns:
	        List of model names, or an empty list when no family matches, the
	        response is not HTTP 200, or any exception occurs.
	    """
	    try:
	        resp = requests.get('http://localhost:11434/api/tags', timeout=2)
	        if resp.status_code != 200:
	            return []
	        installed = [entry['name'] for entry in resp.json().get('models', [])]
	        for family in ('qwen3.5:2b', 'qwen3.5', 'gemma3'):
	            candidates = [name for name in installed if family in name]
	            if candidates:
	                return candidates
	        return []
	    except Exception:
	        return []


	def get_llm_explanation(email_text, label, confidence, proba,
	                        lime_features, shap_features, eli5_features, model_name):
	    """Ask the Ollama model for a plain-language explanation of a verdict.

	    Args:
	        email_text: Email text; only the first 500 characters are sent.
	        label: Classification label; "SPAM" selects the spam wording, any
	            other value the not-spam wording.
	        confidence: Probability of the chosen label, in the 0-1 range.
	        proba: Sequence whose items 0 and 1 are the ham and spam probabilities.
	        lime_features: (name, weight) pairs; the first five are quoted.
	        shap_features: (name, value) pairs; the first five are quoted.
	        eli5_features: Feature names; the first five are quoted.
	        model_name: Ollama model name to query.

	    Returns:
	        The model's reply with any <think> section removed, a placeholder
	        when the reply is empty, or an error message string when the
	        request fails or returns a non-200 status.
	    """
	    # Get natural language explanation from Ollama Qwen 3.5
	    print('Running LLM explanation...')
	    truncated = email_text[:500] + ('...' if len(email_text) > 500 else '')

	    spam_or_not = "spam" if label == "SPAM" else "NOT spam"

	    lime_part = ', '.join([f'{name} ({weight:+.3f})' for name, weight in lime_features[:5]])
	    shap_part = ', '.join([f'{name} ({val:+.3f})' for name, val in shap_features[:5]])
	    eli5_part = ', '.join([str(name) for name in eli5_features[:5]])

	    # The separator between the two probabilities is a plain "|". The
	    # previous "\|" is an invalid escape sequence (a SyntaxWarning on
	    # Python 3.12+) and put a stray backslash into the prompt.
	    prompt = (
	        f'FACT: This email has been classified as {label} with {confidence * 100:.1f}% confidence.\n'
	        f'Your job is to explain WHY it is {label}, not to reclassify it.\n'
	        f'Ham probability: {proba[0] * 100:.1f}% | Spam probability: {proba[1] * 100:.1f}%\n\n'
	        f'Email (truncated): "{truncated}"\n\n'
	        f'Top features driving this decision:\n'
	        f'- LIME: {lime_part}\n'
	        f'- SHAP: {shap_part}\n'
	        f'- ELI5: {eli5_part}\n\n'
	        f'You are an email security analyst explaining this to a non-technical user.\n'
	        f'Do NOT contradict the classification. The email IS {spam_or_not}.\n\n'
	        f'In 3-5 sentences, explain why this email is {label}. '
	        f'Reference specific words or patterns from the email. '
	        f'Do not use technical jargon like "TF-IDF" or "SHAP values". /no_think'
	    )

	    try:
	        resp = requests.post(OLLAMA_API, json={
	            'model': model_name,
	            'messages': [{'role': 'user', 'content': prompt}],
	            'stream': False,
	            'think': False,
	            'options': {'temperature': 0.3, 'num_predict': 300}
	        }, timeout=120)
	        if resp.status_code == 200:
	            content = resp.json().get('message', {}).get('content', '')
	            # Strip any residual thinking tags
	            content = re.sub(r'<think>.*?</think>', '', content, flags=re.DOTALL).strip()
	            print('Done!')
	            return content or 'No response generated.'
	        return 'Ollama error: HTTP %d' % resp.status_code
	    except (requests.RequestException, ValueError) as e:
	        # ValueError covers a response body that is not valid JSON
	        return 'Could not connect to Ollama (%s). Make sure it is running (ollama serve).' % e

	# Ask LLM to classify email and provide second opinion
	def get_llm_second_opinion(email_text, rf_spam_prob, model_name, domain_info=None):
	    """Ask the Ollama model to classify the email independently.

	    Args:
	        email_text: Email text; only the first 1000 characters are sent.
	        rf_spam_prob: Accepted for the caller's convenience; not read here.
	        model_name: Ollama model name to query.
	        domain_info: Optional dict as returned by check_domain_trust; when
	            its ``trusted`` entry is truthy a hint is added to the prompt.

	    Returns:
	        A dict with ``spam_prob``, ``classification``, ``confidence`` and
	        ``reason``, or None when the request fails, the status is not 200,
	        no JSON object can be parsed, or any other exception occurs.
	    """
	    print('Running LLM second opinion...')
	    truncated = email_text[:1000] + ('...' if len(email_text) > 1000 else '')

	    domain_hint = ""
	    if domain_info and domain_info.get('trusted'):
	        domain_hint = f'\nIMPORTANT: This email is from {domain_info["domain"]} ({domain_info["match"]} domain). Government, military, and educational emails are almost always legitimate.\n'

	    prompt = ''.join([
	        f'Classify this email as spam or ham (legitimate). Most emails are legitimate.\n',
	        f'{domain_hint}\n',
	        f'HAM examples: newsletters, order confirmations, bank alerts, church emails, subscription updates, gaming notifications, shipping alerts.\n',
	        f'SPAM examples: prize scams, phishing for passwords, fake invoices, Nigerian prince schemes.\n\n',
	        f'If unsure, choose ham. False positives are worse than false negatives.\n\n',
	        f'Email: "{truncated}"\n\n',
	        f'Reply with ONLY this JSON format:\n',
	        f'{{"classification": "ham", "confidence": 0.85, "reason": "why"}}\n',
	        f'or\n',
	        f'{{"classification": "spam", "confidence": 0.95, "reason": "why"}}\n',
	        f'/no_think',
	    ])
	    request_body = {
	        'model': model_name,
	        'messages': [{'role': 'user', 'content': prompt}],
	        'stream': False,
	        'think': False,
	        'options': {'temperature': 0.1, 'num_predict': 150}
	    }

	    try:
	        resp = requests.post(OLLAMA_API, json=request_body, timeout=60)
	        if resp.status_code != 200:
	            return None
	        content = resp.json().get('message', {}).get('content', '')
	        content = re.sub(r'<think>.*?</think>', '', content, flags=re.DOTALL).strip()

	        # Extract JSON from response - try json.loads first, regex fallback
	        try:
	            data = json.loads(content)
	        except (json.JSONDecodeError, ValueError):
	            data = None
	            json_match = re.search(r'\{.*\}', content, re.DOTALL)
	            if json_match:
	                try:
	                    data = json.loads(json_match.group())
	                except (json.JSONDecodeError, ValueError):
	                    pass
	        if not data:
	            return None

	        classification = data.get('classification', '').lower().strip()
	        llm_conf = float(data.get('confidence', 0.5))
	        reason = data.get('reason', '')
	        # Confidence refers to the chosen class, so flip it for anything but "spam"
	        if classification == 'spam':
	            llm_spam_prob = llm_conf
	        else:
	            llm_spam_prob = 1 - llm_conf
	        print('Done!')
	        return {'spam_prob': llm_spam_prob, 'classification': classification,
	                'confidence': llm_conf, 'reason': reason}
	    except Exception:
	        # Best effort: any failure means "no second opinion"
	        return None


	# Apply theme colors to a matplotlib figure and axes
	def apply_figure_theme(fig, ax, theme):
	    """Recolor a figure and its axes from a theme dict.

	    Args:
	        fig: Figure whose background patch is recolored.
	        ax: Axes whose background, title, axis labels, ticks and spines
	            are recolored.
	        theme: Dict providing ``ax_facecolor``, ``text_color`` and
	            ``grid_color``.
	    """
	    background = theme['ax_facecolor']
	    fig.patch.set_facecolor(background)
	    ax.set_facecolor(background)

	    foreground = theme['text_color']
	    for text_artist in (ax.title, ax.xaxis.label, ax.yaxis.label):
	        text_artist.set_color(foreground)
	    ax.tick_params(colors=foreground)

	    for border in ax.spines.values():
	        border.set_edgecolor(theme['grid_color'])


	# Page config
	# Wide layout with the sidebar expanded on first load
	st.set_page_config(page_title="Spam Classifier + XAI", layout="wide",
	                   page_icon="@", initial_sidebar_state="expanded")

	# Restore state from localStorage on page refresh
	# Runs only while no results are held in session state. The '_skip_restore'
	# flag (set by the "New Classification" button) turns this pass into a
	# localStorage wipe instead of a restore.
	if 'results' not in st.session_state:
	    if st.session_state.pop('_skip_restore', False):
	        # Reset was just triggered — clear localStorage now (JS actually executes on this rerun)
	        clear_local_storage()
	    else:
	        stored = load_from_local_storage()
	        if stored:
	            # Lists in the stored results are turned back into numpy arrays
	            restored_results = _deserialize_results(stored.get('results'))
	            if restored_results:
	                st.session_state['results'] = restored_results
	            if stored.get('email_input'):
	                st.session_state['email_input'] = stored['email_input']
	            if 'dark_mode' in stored:
	                st.session_state['dark_mode'] = stored['dark_mode']
	            if 'reset_counter' in stored:
	                st.session_state['reset_counter'] = stored['reset_counter']
	            # Stored under a different name: the sidebar reads 'saved_threshold'
	            # as the slider's default
	            if 'threshold' in stored:
	                st.session_state['saved_threshold'] = stored['threshold']

	# Dark mode toggle setup
	if 'dark_mode' not in st.session_state:
	    st.session_state['dark_mode'] = False
	dark_mode = st.session_state['dark_mode']
	# Each theme key is listed with its (dark, light) colour pair; the
	# comprehension picks the side that matches the current mode.
	THEME = {
	    theme_key: (dark_value if dark_mode else light_value)
	    for theme_key, (dark_value, light_value) in {
	        'spam_color': ('#ff6b6b', '#c62828'),
	        'ham_color': ('#69db7c', '#2e7d32'),
	        'spam_bg': ('#3d1515', '#ffebee'),
	        'ham_bg': ('#153d1a', '#e8f5e9'),
	        'metric_bg': ('#2d2d2d', '#f0f2f6'),
	        'text_color': ('#e0e0e0', '#1a1a1a'),
	        'ax_facecolor': ('#1e1e1e', '#ffffff'),
	        'axvline_color': ('#aaaaaa', '#333333'),
	        'bar_spam': ('#ff6b6b', '#e74c3c'),
	        'bar_ham': ('#69db7c', '#2ecc71'),
	        'bar_edge': ('#666666', '#333333'),
	        'grid_color': ('#444444', '#cccccc'),
	        'gauge_ham': ('#69db7c', '#4CAF50'),
	        'gauge_spam': ('#ff6b6b', '#f44336'),
	    }.items()
	}

	# Build dark mode CSS string
	# Stays empty in light mode; in dark mode it holds the override rules that
	# are appended to the <style> block injected below.
	_dark_css = ""
	if dark_mode:
	    _dark_css = """
	/* Full-page dark mode overrides */
	.stApp, .stApp > header, [data-testid='stAppViewContainer'],
	[data-testid='stHeader'], section[data-testid='stSidebar'],
	section[data-testid='stSidebar'] > div {
	background-color: #1a1a2e !important;
	color: #e0e0e0 !important;
	}
	section[data-testid='stSidebar'] {
	background-color: #16213e !important;
	}
	.stApp h1, .stApp h2, .stApp h3, .stApp h4, .stApp p,
	.stApp label, .stApp span, .stApp div,
	[data-testid='stMarkdownContainer'], [data-testid='stMarkdownContainer'] p,
	[data-testid='stMarkdownContainer'] h1, [data-testid='stMarkdownContainer'] h2,
	[data-testid='stMarkdownContainer'] h3, [data-testid='stMarkdownContainer'] h4 {
	color: #e0e0e0 !important;
	}
	div[data-testid='stMetric'] label,
	div[data-testid='stMetric'] [data-testid='stMetricValue'],
	div[data-testid='stMetric'] [data-testid='stMetricLabel'] {
	color: #e0e0e0 !important;
	}
	.stTabs [data-baseweb='tab'] {
	color: #b0b0b0 !important;
	}
	.stTabs [data-baseweb='tab'][aria-selected='true'] {
	color: #ff6b6b !important;
	}
	.stTextArea textarea, [data-baseweb='textarea'] textarea {
	background-color: #0f3460 !important;
	color: #e0e0e0 !important;
	border-color: #333 !important;
	}
	.stButton button:not([data-testid='stBaseButton-primary']) {
	background-color: #16213e !important;
	color: #e0e0e0 !important;
	border-color: #444 !important;
	}
	[data-testid='stExpander'] {
	background-color: #16213e !important;
	border-color: #333 !important;
	}
	hr { border-color: #333 !important; }
	[data-testid='stSlider'] p { color: #b0b0b0 !important; }
	pre, code, .stCodeBlock { color: #e0e0e0 !important; background-color: #1e1e2e !important; }
	.stJson { color: #e0e0e0 !important; background-color: #1e1e2e !important; }
	[data-testid='stExpander'] pre { background-color: #1e1e2e !important; }
	div[data-baseweb='popover'] > div,
	div[data-baseweb='tooltip'] > div {
	background-color: #16213e !important;
	color: #e0e0e0 !important;
	}
	"""

	# Inject the app's stylesheet: tab and metric styling, the result banners
	# (coloured from THEME), the trust badge, text wrapping inside column
	# blocks, and the dark-mode overrides when they are set.
	st.markdown("""
	<style>
	.stTabs [data-baseweb="tab-list"] { gap: 8px; }
	.stTabs [data-baseweb="tab"] {
	padding: 8px 20px;
	border-radius: 8px 8px 0 0;
	font-weight: 600;
	}
	div[data-testid="stMetric"] {
	background-color: """ + THEME['metric_bg'] + """;
	border-radius: 10px;
	padding: 15px;
	border-left: 4px solid #4CAF50;
	}
	.big-result {
	font-size: 1.5em;
	font-weight: bold;
	padding: 10px 20px;
	border-radius: 10px;
	text-align: center;
	margin-top: 8px;
	margin-bottom: 8px;
	}
	.spam-result { background-color: """ + THEME['spam_bg'] + """; color: """ + THEME['spam_color'] + """; border: 2px solid """ + THEME['spam_color'] + """; }
	.ham-result { background-color: """ + THEME['ham_bg'] + """; color: """ + THEME['ham_color'] + """; border: 2px solid """ + THEME['ham_color'] + """; }
	.trust-badge { background-color: #1565c0; color: white; padding: 4px 12px; border-radius: 20px; font-size: 0.85em; display: inline-block; margin: 4px 0; }
	[data-testid="stHorizontalBlock"] code {
	word-break: break-all;
	white-space: pre-wrap;
	}
	[data-testid="stHorizontalBlock"] p {
	word-wrap: break-word;
	overflow-wrap: break-word;
	}
	""" + _dark_css + """
	</style>
	""", unsafe_allow_html=True)

	# Load model
	# load_model() is wrapped in st.cache_resource. If a model file is missing,
	# show an error and stop the script instead of failing further down.
	try:
	    model, vectorizer, feature_names, training_sample, raw_rf, saved_threshold, training_config, meta_scaler = load_model()
	except FileNotFoundError:
	    st.error("Model files not found. Please run the notebook or `python retrain.py` first.")
	    st.stop()

	# Sidebar
	# Holds the dark-mode toggle, the reset button, the threshold slider, the
	# input-mode selector, the example emails, the "How It Works" text and the
	# Ollama model picker. Defines `threshold`, `input_mode` and
	# `selected_model` for the main area.
	with st.sidebar:
	    st.toggle("Dark Mode", key='dark_mode')
	    if st.button("New Classification", use_container_width=True):
	        old_counter = st.session_state.get('reset_counter', 0)
	        # Drop everything tied to the previous classification
	        for stale_key in ('results', 'email_input', 'feedback_given',
	                          'feedback_wrong', 'feedback_saved', 'feedback_msg',
	                          'email_textarea_%d' % old_counter):
	            st.session_state.pop(stale_key, None)
	        # A new counter value gives the text area a fresh widget key
	        st.session_state['reset_counter'] = old_counter + 1
	        # Tells the restore step to clear localStorage on the next run
	        st.session_state['_skip_restore'] = True
	        st.rerun()
	    st.markdown("---")
	    st.header("Spam Classifier + XAI")
	    st.caption("ENGT 375 | Spring 2026 | ODU")
	    st.markdown("---")

	    # Classification threshold slider
	    # The threshold slider lets users adjust how cautious the classifier is -
	    # higher threshold = fewer false spam flags but might miss some real spam
	    #
	    # The restored value is read with get(), not pop(): the slider has no
	    # key, so its default must stay the same across reruns or Streamlit
	    # treats it as a new widget and resets it. The explicit None check
	    # keeps a restored threshold of 0.0 from being replaced by 0.60.
	    restored_threshold = st.session_state.get('saved_threshold')
	    default_threshold = 0.60 if restored_threshold is None else restored_threshold
	    threshold = st.slider("Classification Threshold", 0.0, 1.0, float(default_threshold), 0.05,
	                          help="Emails with spam probability above this threshold are classified as spam. Default 0.60 to reduce false positives.")

	    st.markdown("---")

	    # Input mode selection
	    input_mode = st.radio("Input Mode", ["Email Body Only", "Full Email with Headers"],
	                          help="Use 'Full Email with Headers' to get additional signals from email headers (List-Unsubscribe, SPF, DKIM).")

	    st.markdown("---")

	    # Example emails
	    st.subheader("Example Emails")
	    st.caption("Click to load a sample email")
	    for name, text in EXAMPLE_EMAILS.items():
	        if st.button(name, key="ex_%s" % name, use_container_width=True):
	            st.session_state['email_input'] = text

	    st.markdown("---")

	    # How it works
	    with st.expander("How It Works"):
	        st.markdown("""
	1. Text Input
	- Paste email text directly, or upload an email screenshot (the app reads text from images)

	2. Text Cleanup
	- Strips out HTML code, web links, and email addresses
	- Converts everything to lowercase and reduces words to their root form (e.g., "running" -> "run")
	- Removes common filler words like "the", "is", "and"

	3. Feature Extraction
	- Word Importance (3000 words/phrases) — measures how important each word or phrase is compared to all emails the model has seen
	- Email Patterns (24 measurements) — things like how many exclamation marks, ALL CAPS words, links, dollar signs, and spam-like phrases appear
	- AI Analysis (6 scores, if available) — a language model rates the email's intent (promotional, personal, phishing) and tone (urgency, formality)

	4. Decision Forest Classifier
	- Hundreds of decision trees that each vote on spam vs. ham — the majority wins
	- Trained on ~70,000 emails from multiple sources
	- The model automatically adjusts for uneven spam/ham ratios and fine-tunes its confidence scores
	- Best settings found by testing many combinations automatically (GridSearchCV)

	5. Domain Trust
	- Emails from .gov, .mil, and .edu domains are given the benefit of the doubt
	- Trusted senders are capped at 30% spam probability max

	6. Explainability (XAI)
	- LIME — hides different words and watches how the prediction changes to find which words matter most
	- SHAP — calculates how much each word or feature pushed the result toward spam or toward ham, like a tug-of-war score
	- ELI5 — looks inside the model to show which words it considers most important
	- AI Explanation — a language model summarizes the findings in everyday language
	""")

	    # Ollama status
	    qwen_models = check_ollama()
	    if qwen_models:
	        selected_model = st.selectbox("LLM Model", qwen_models, index=0)
	    else:
	        st.warning("Ollama not available - AI Explanation tab disabled")
	        selected_model = None

	# Main area
	st.title("Spam Email Classifier with Explainable AI")
	st.markdown("Classify emails and understand why using LIME, SHAP, ELI5, and AI-powered explanations.")

	# Input text area
	# The widget key includes the reset counter, so "New Classification"
	# (which increments the counter) produces a fresh text area.
	default_text = st.session_state.get('email_input', '')
	counter = st.session_state.get('reset_counter', 0)
	email_text = st.text_area("Paste an email to classify:", value=default_text,
	                          height=200, placeholder="Paste email content here...",
	                          key="email_textarea_%d" % counter)

	classify_clicked = st.button("Classify", type="primary", use_container_width=True)

	# Classification run: builds the feature vector, predicts, applies the
	# domain/header adjustments, computes the LIME/SHAP/ELI5 explanations and
	# the optional LLM summary, then stores everything in session state and
	# in the browser's localStorage.
	if classify_clicked and email_text.strip():
	    # Compute and cache all results
	    with st.spinner("Classifying and computing XAI explanations..."):
	        print('Running classification...')

	        # Check domain trust BEFORE preprocessing
	        domain_info = check_domain_trust(email_text)

	        # Extract header features if full email mode
	        header_features = {}
	        if input_mode == "Full Email with Headers":
	            header_features = extract_header_features(email_text)

	        clean = preprocess_text(email_text)
	        tfidf_features = vectorizer.transform([clean])
	        meta_features = compute_metadata_features([email_text])

	        # Apply metadata scaler if available (matches training normalization)
	        if meta_scaler is not None:
	            meta_features = meta_scaler.transform(meta_features)

	        # Add LLM features if model was trained with them
	        if training_config.get('llm_features_used'):
	            if selected_model:
	                llm_feats = extract_llm_features_single(email_text, model_name=selected_model)
	            else:
	                llm_feats = np.full((1, 6), 0.5)  # neutral fallback if LLM is offline
	            # Combine TF-IDF + metadata + LLM features into one feature vector
	            # (same order as during training so the model gets the right inputs)
	            X_input = hstack([tfidf_features, csr_matrix(meta_features), csr_matrix(llm_feats)]).toarray()
	        else:
	            X_input = hstack([tfidf_features, csr_matrix(meta_features)]).toarray()

	        # Prediction
	        proba = model.predict_proba(X_input)[0]

	        # LLM scoring removed — small model confidence was static (~92-95%)
	        # LLM still used for AI Explanation tab via get_llm_explanation()
	        llm_second_opinion = None
	        llm_weight_used = 0.0
	        original_proba = proba.copy()

	        # Domain trust cap - max 30% spam for trusted domains
	        if domain_info.get('trusted'):
	            if proba[1] > 0.30:
	                proba = np.array([0.70, 0.30])

	        # Header-based post-classification adjustment
	        if header_features:
	            adjustment = 0.0
	            if header_features.get('has_list_unsubscribe'):
	                adjustment = adjustment - 0.10  # Strong ham signal
	            if header_features.get('sender_is_gov'):
	                adjustment = adjustment - 0.15  # Government sender
	            if header_features.get('has_spf_pass'):
	                adjustment = adjustment - 0.03
	            if header_features.get('has_dkim_pass'):
	                adjustment = adjustment - 0.03
	            if adjustment != 0.0:
	                # Keep the adjusted probability inside [0.01, 0.99]
	                adjusted_spam = max(0.01, min(0.99, proba[1] + adjustment))
	                proba = np.array([1 - adjusted_spam, adjusted_spam])

	        # LIME explanation
	        print('Running LIME explanation...')
	        lime_training_data = training_sample if training_sample is not None else X_input
	        explainer = get_lime_explainer(lime_training_data, feature_names)
	        exp = explainer.explain_instance(X_input[0], raw_rf.predict_proba, num_features=10)
	        label_to_explain = list(exp.as_map().keys())[0]
	        feature_weights = exp.as_list(label=label_to_explain)
	        print('Done!')

	        # SHAP explanation - I have to use the raw RF here because SHAP's
	        # TreeExplainer doesn't work with the calibrated model wrapper
	        print('Running SHAP explanation...')
	        shap_explainer = get_shap_explainer(raw_rf)
	        shap_values = shap_explainer.shap_values(X_input, check_additivity=False)
	        # SHAP returns different shapes depending on the version, so I have to
	        # check which format it gives me (this took a while to debug)
	        if isinstance(shap_values, list):
	            sv = shap_values[1][0]
	        elif shap_values.ndim == 3:
	            sv = shap_values[0, :, 1]
	        else:
	            sv = shap_values[0]
	        # Indices of the ten features with the largest absolute SHAP value
	        top_idx = np.argsort(np.abs(sv))[::-1][:10]
	        print('Done!')

	        # ELI5 explanation
	        print('Running ELI5 explanation...')
	        eli5_exp = eli5.explain_prediction(raw_rf, X_input[0], feature_names=feature_names, top=10)
	        eli5_html = eli5.format_as_html(eli5_exp)
	        # The top-5 explanation is computed once and reused for both the
	        # text rendering and the feature-name list (it used to be computed
	        # twice with identical arguments).
	        eli5_top_exp = eli5.explain_prediction(raw_rf, X_input[0], feature_names=feature_names, top=5)
	        eli5_text = eli5.format_as_text(eli5_top_exp)
	        eli5_feat_names = []
	        if hasattr(eli5_top_exp, 'targets') and eli5_top_exp.targets:
	            top_weights = eli5_top_exp.targets[0].feature_weights
	            eli5_feat_names.extend(fw.feature for fw in top_weights.pos[:5])
	            eli5_feat_names.extend(fw.feature for fw in top_weights.neg[:5])
	        print('Done!')

	        # AI Explanation (if Ollama available)
	        # I send the XAI results to the LLM so it can explain them in plain English -
	        # most people won't understand raw SHAP values or LIME weights
	        ai_explanation = None
	        if selected_model:
	            lime_feats = [(f, w) for f, w in feature_weights[:5]]
	            shap_feats = [(feature_names[i], float(sv[i])) for i in top_idx[:5]]
	            prediction = 1 if proba[1] >= threshold else 0
	            label = "SPAM" if prediction == 1 else "HAM"
	            confidence = proba[prediction]
	            ai_explanation = get_llm_explanation(
	                email_text, label, confidence, proba,
	                lime_feats, shap_feats, eli5_feat_names, selected_model
	            )

	    # Store everything in session state
	    st.session_state['results'] = {
	        'email_text': email_text,
	        'clean': clean,
	        # Recomputed here so the stored row is the unscaled metadata
	        'meta': compute_metadata_features([email_text])[0],
	        'proba': proba,
	        'original_proba': original_proba,
	        'llm_second_opinion': llm_second_opinion,
	        'domain_info': domain_info,
	        'header_features': header_features,
	        'feature_weights': feature_weights,
	        'sv': sv,
	        'top_idx': top_idx,
	        'eli5_html': eli5_html,
	        'eli5_text': eli5_text,
	        'eli5_feat_names': eli5_feat_names,
	        'ai_explanation': ai_explanation,
	        'llm_weight_used': llm_weight_used,
	    }

	    # Persist to browser localStorage
	    save_to_local_storage({
	        'results': st.session_state['results'],
	        'email_input': email_text,
	        'dark_mode': st.session_state.get('dark_mode', False),
	        'reset_counter': st.session_state.get('reset_counter', 0),
	        'threshold': threshold,
	    })

	elif classify_clicked:
	    st.warning("Please paste an email to classify.")

	# Display results from session state (survives reruns)
	# NOTE(review): the display sections that follow all read `r`, so they
	# presumably live inside this `if` as well - confirm the nesting.
	if 'results' in st.session_state:
	    r = st.session_state['results']
	    proba, sv = r['proba'], r['sv']
	    top_idx, feature_weights = r['top_idx'], r['feature_weights']

	    # The verdict is recomputed against the current threshold instead of
	    # being stored, so moving the threshold slider takes effect on rerun.
	    prediction = 1 if proba[1] >= threshold else 0
	    label = ("HAM", "SPAM")[prediction]
	    confidence = proba[prediction]

	# Domain trust badge
	# Drawn only when the stored domain info carries a truthy 'trusted' flag;
	# results without a 'domain_info' entry fall back to an empty dict.
	domain_info = r.get('domain_info', {})
	if domain_info.get('trusted'):
	    badge_args = (domain_info["domain"], domain_info["match"])
	    st.markdown(
	        '<span class="trust-badge">Trusted Domain: %s (%s)</span>' % badge_args,
	        unsafe_allow_html=True,
	    )

	# Header features info
	# Each truthy header flag contributes one human-readable line; the lines
	# are shown together in a single info box, and nothing is shown when no
	# flag is set.
	header_features = r.get('header_features', {})
	if header_features:
	    # (flag key, message) pairs, in display order.
	    signal_messages = (
	        ('has_list_unsubscribe', "Has unsubscribe link (legitimate mailing lists include this)"),
	        ('sender_is_gov', "Government sender domain"),
	        ('has_spf_pass', "SPF passed (sender's server is authorized)"),
	        ('has_dkim_pass', "DKIM passed (email signature verified)"),
	    )
	    header_signals = [
	        message for flag, message in signal_messages if header_features.get(flag)
	    ]
	    if header_signals:
	        # A plain '|' separator: a backslash before the pipe is not a valid
	        # Python escape sequence, and the rendered Markdown is the same.
	        st.info("Header signals: %s" % ' | '.join(header_signals))

	# Preprocessing visualization
	# Collapsed-by-default expander with the raw email next to its cleaned
	# form, followed by a table of the extracted metadata values.
	# NOTE(review): indentation was lost in this copy of the file; the metadata
	# table below presumably sits inside the expander too - confirm.
	with st.expander("Preprocessing Steps", expanded=False):
	col_a, col_b = st.columns(2)
	with col_a:
	st.markdown("Original Text (first 300 chars)")
	# Show at most 300 characters; '...' is appended only when text was cut.
	st.code(r['email_text'][:300] + ('...' if len(r['email_text']) > 300 else ''), language='text')
	with col_b:
	st.markdown("After Preprocessing (first 300 chars)")
	# Same 300-character preview rule, applied to the preprocessed text.
	st.code(r['clean'][:300] + ('...' if len(r['clean']) > 300 else ''), language='text')

	# Display labels for the metadata vector, paired positionally with
	# r['meta']. There are 24 labels, and the DataFrame below needs r['meta']
	# to have the same length.
	# NOTE(review): the order presumably mirrors compute_metadata_features'
	# output order - verify against utils_student.
	meta_names = ['Exclamation Mark Density', 'Dollar Sign Count', 'ALL CAPS Word Ratio',
	'Spam Phrase Count', 'Ham Phrase Count', 'Spam vs. Ham Word Balance',
	'Link Count', 'HTML Code Tags', 'Email Length (chars)',
	'Avg Sentence Length', 'ALL CAPS Usage',
	'Mentions a Specific Date', 'Mentions a Specific Time', 'Date Reference Count',
	'Has Unsubscribe Link', 'Has Physical Address', 'Has Proper Greeting',
	'Has Contact Info', 'Sign-up/Register Language Score',
	'Sales Language vs. Info Ratio', 'Shortened Link Usage',
	'Known Platform Links', 'Gov/Edu Link Count',
	'Question Mark Count']
	st.markdown("Extracted Metadata Features:")
	# Two-column table: one row per label, with the index column hidden.
	meta_df = pd.DataFrame({'Feature': meta_names, 'Value': r['meta']})
	st.dataframe(meta_df, use_container_width=True, hide_index=True)

	# Display result
	# Three columns: the verdict banner, the numeric metrics, and a small
	# probability gauge.
	st.markdown("---")
	col1, col2, col3 = st.columns([1.5, 1, 1.5])

	with col1:
	    # The CSS class follows the verdict so spam and ham are styled differently.
	    css_class = "ham-result" if prediction != 1 else "spam-result"
	    st.markdown('<div class="big-result %s">%s</div>' % (css_class, label), unsafe_allow_html=True)

	with col2:
	    st.metric("Confidence", "%.1f%%" % (confidence * 100))
	    st.metric("Threshold", "%.0f%%" % (threshold * 100))

	with col3:
	    # Confidence gauge: one stacked horizontal bar (ham segment first, spam
	    # segment starting where ham ends) with a dashed line at the threshold.
	    ham_share, spam_share = proba[0], proba[1]
	    threshold_label = 'Threshold (%.0f%%)' % (threshold * 100)
	    fig_gauge, ax_gauge = plt.subplots(figsize=(4, 1.8))
	    ax_gauge.barh([0], [ham_share], color=THEME['gauge_ham'], height=0.5, label='Ham')
	    ax_gauge.barh([0], [spam_share], left=[ham_share], color=THEME['gauge_spam'], height=0.5, label='Spam')
	    ax_gauge.axvline(x=threshold, color=THEME['axvline_color'], linestyle='--', linewidth=2, label=threshold_label)
	    ax_gauge.set_xlim(0, 1)
	    ax_gauge.set_yticks([])
	    # The legend is anchored above the axes; the top margin set below
	    # leaves room for it.
	    ax_gauge.legend(
	        loc='upper center', ncol=3, fontsize=6, bbox_to_anchor=(0.5, 1.4),
	        facecolor=THEME['ax_facecolor'], labelcolor=THEME['text_color'],
	    )
	    apply_figure_theme(fig_gauge, ax_gauge, THEME)
	    fig_gauge.subplots_adjust(top=0.65, bottom=0.15)
	    st.pyplot(fig_gauge, transparent=not dark_mode)
	    plt.close()

	# XAI Explanations
	st.markdown("---")
	st.subheader("Explainable AI Analysis")

	# Four explainer tabs are always present; the "AI Explanation" tab is
	# appended only when an LLM model is selected.
	tab_names = ["LIME", "SHAP", "ELI5", "Comparison"]
	tab_names += ["AI Explanation"] if selected_model else []

	tabs = st.tabs(tab_names)

	# LIME Tab
	# Horizontal bar chart of the LIME (feature, weight) pairs: positive
	# weights use the spam colour, the rest use the ham colour.
	with tabs[0]:
	    st.markdown("#### LIME — What Words Mattered?")
	    st.caption("LIME hides different words in the email and watches how the prediction changes — this reveals which words matter most.")

	    # Ascending sort by weight: barh draws the first item at the bottom,
	    # so the largest positive weight ends up at the top of the chart.
	    features_sorted = sorted(feature_weights, key=lambda x: x[1])
	    names_lime = [f[0] for f in features_sorted]
	    weights_lime = [f[1] for f in features_sorted]

	    fig, ax = plt.subplots(figsize=(8, 5))
	    colors_bar = [THEME['bar_spam'] if w > 0 else THEME['bar_ham'] for w in weights_lime]
	    ax.barh(names_lime, weights_lime, color=colors_bar, edgecolor=THEME['bar_edge'], alpha=0.85)
	    ax.axvline(x=0, color=THEME['axvline_color'], linewidth=0.8)
	    ax.set_title('LIME: Feature Contributions to Classification', fontsize=13, fontweight='bold')
	    # Plain '|' separator: Matplotlib renders label text verbatim, so a
	    # backslash-escaped pipe would show a stray backslash (and is not a
	    # valid Python escape sequence).
	    ax.set_xlabel('Bars pointing right \u2192 pushes toward SPAM | Bars pointing left \u2192 pushes toward HAM')
	    apply_figure_theme(fig, ax, THEME)
	    plt.tight_layout()
	    st.pyplot(fig, transparent=not dark_mode)
	    plt.close()

	# SHAP Tab
	# Horizontal bar chart of the SHAP values at the stored top indices:
	# positive values use the spam colour, the rest use the ham colour.
	with tabs[1]:
	    st.markdown("#### SHAP — Tug-of-War Scores")
	    st.caption("SHAP calculates how much each word or feature pushed the result toward spam or toward ham — like a tug-of-war score.")

	    # Coerce to arrays before fancy indexing: values that went through the
	    # JSON/localStorage round trip may come back as plain lists, and a
	    # list cannot be indexed by a list of positions.
	    # NOTE(review): harmless if the restore path already rebuilds ndarrays.
	    shap_vector = np.asarray(sv)
	    shap_positions = np.asarray(top_idx, dtype=int)
	    top_features_shap = [feature_names[i] for i in shap_positions]
	    top_vals_shap = shap_vector[shap_positions]

	    fig, ax = plt.subplots(figsize=(8, 5))
	    colors_bar = [THEME['bar_spam'] if v > 0 else THEME['bar_ham'] for v in top_vals_shap]
	    # Everything is reversed so the first (strongest) entry is drawn at the
	    # top, since barh places the first item at the bottom.
	    ax.barh(top_features_shap[::-1], top_vals_shap[::-1],
	            color=colors_bar[::-1], edgecolor=THEME['bar_edge'], alpha=0.85)
	    ax.axvline(x=0, color=THEME['axvline_color'], linewidth=0.8)
	    ax.set_title('SHAP: Top Feature Contributions', fontsize=13, fontweight='bold')
	    # Plain '|' separator: Matplotlib renders label text verbatim, so a
	    # backslash-escaped pipe would show a stray backslash (and is not a
	    # valid Python escape sequence).
	    ax.set_xlabel('Bars pointing right \u2192 pushes toward SPAM | Bars pointing left \u2192 pushes toward HAM')
	    apply_figure_theme(fig, ax, THEME)
	    plt.tight_layout()
	    st.pyplot(fig, transparent=not dark_mode)
	    plt.close()

	# ELI5 Tab
	# Embeds the stored ELI5 HTML. In dark mode the markup is wrapped in a
	# white box with black text and a caption explains the light background.
	with tabs[2]:
	    st.markdown("#### ELI5 — Model's Own Rankings")
	    st.caption("ELI5 looks inside the model to show which words it considers most important for its decision.")
	    eli5_html = (
	        '<div style="background:#fff;color:#000;padding:8px;border-radius:6px;">%s</div>' % r['eli5_html']
	        if dark_mode
	        else r['eli5_html']
	    )
	    st.components.v1.html(eli5_html, height=400, scrolling=True)
	    if dark_mode:
	        st.caption("ELI5 uses its own styling - shown with light background for readability.")

	# Comparison Tab
	# Top-5 lists from the three explainers side by side, then a count of the
	# feature names that LIME and SHAP share in their top 10.
	with tabs[3]:
	    st.markdown("#### Side-by-Side Comparison")
	    st.caption("If multiple tools agree a word is important, that's a stronger signal it actually matters.")
	    col1, col2, col3 = st.columns(3)

	    with col1:
	        st.markdown("##### LIME Top 5")
	        for feat, w in feature_weights[:5]:
	            leans_spam = w > 0
	            direction = "spam" if leans_spam else "ham"
	            color = THEME['spam_color'] if leans_spam else THEME['ham_color']
	            # Names longer than 20 characters are cut and given an ellipsis.
	            display_feat = feat if len(feat) <= 20 else feat[:20] + "..."
	            st.markdown(
	                "- <span style='color:%s'>`%s`</span> -> %s (%+.3f)" % (color, display_feat, direction, w),
	                unsafe_allow_html=True,
	            )

	    with col2:
	        st.markdown("##### SHAP Top 5")
	        for i in top_idx[:5]:
	            leans_spam = sv[i] > 0
	            direction = "spam" if leans_spam else "ham"
	            color = THEME['spam_color'] if leans_spam else THEME['ham_color']
	            display_feat = feature_names[i] if len(feature_names[i]) <= 20 else feature_names[i][:20] + "..."
	            st.markdown(
	                "- <span style='color:%s'>`%s`</span> -> %s (%+.3f)" % (color, display_feat, direction, sv[i]),
	                unsafe_allow_html=True,
	            )

	    with col3:
	        # ELI5 entries are stored as names only, so no direction or weight is shown.
	        st.markdown("##### ELI5 Top 5")
	        for feat_name in r['eli5_feat_names'][:5]:
	            display_feat = feat_name if len(feat_name) <= 20 else feat_name[:20] + "..."
	            st.markdown("- `%s`" % display_feat)

	    # Feature agreement analysis
	    # NOTE(review): the overlap is an exact string match; if LIME names
	    # carry conditions (e.g. "word > 0.00") they will never equal SHAP's
	    # names - confirm how feature_weights is built upstream.
	    st.markdown("---")
	    st.markdown("##### Feature Agreement")
	    lime_top = {f[0] for f in feature_weights[:10]}
	    shap_top = {feature_names[i] for i in top_idx[:10]}
	    overlap = lime_top.intersection(shap_top)
	    st.markdown("LIME-SHAP overlap (top 10): %d shared features" % len(overlap))
	    if overlap:
	        st.markdown("Shared: %s" % ', '.join('`%s`' % f for f in sorted(overlap)))

	# AI Explanation Tab
	# Exists only when a model is selected (the fifth tab is created under the
	# same condition). Shows the stored LLM text, or a warning when there is none.
	if selected_model:
	    with tabs[4]:
	        st.markdown("#### AI-Powered Explanation")
	        st.caption("Using %s via Ollama to explain the classification in plain English." % selected_model)

	        if not r['ai_explanation']:
	            st.warning("AI explanation was not generated for this classification.")
	        else:
	            st.info(r['ai_explanation'])

	        # This payload is rebuilt from the stored results and the current
	        # threshold, so the label/confidence shown here can differ from what
	        # was sent if the threshold has been moved since classification.
	        lime_feats = [(name, weight) for name, weight in feature_weights[:5]]
	        shap_feats = [(feature_names[idx], float(sv[idx])) for idx in top_idx[:5]]
	        lime_rows = [{'feature': f, 'weight': round(w, 4)} for f, w in lime_feats]
	        shap_rows = [{'feature': f, 'value': round(v, 4)} for f, v in shap_feats]
	        with st.expander("XAI Data Sent to LLM"):
	            st.json({
	                'prediction': label,
	                'confidence': "%.1f%%" % (confidence * 100),
	                'ham_prob': "%.1f%%" % (proba[0] * 100),
	                'spam_prob': "%.1f%%" % (proba[1] * 100),
	                'lime_top5': lime_rows,
	                'shap_top5': shap_rows,
	                'eli5_top5': r['eli5_feat_names'][:5],
	            })

	# Feedback section
	# Users can confirm or reject the verdict; answers are written through
	# save_feedback so they are available when the model is retrained.
	st.markdown("---")
	st.markdown("### Was this classification correct?")

	# The two buttons are offered only until an answer has been given.
	if not st.session_state.get('feedback_given'):
	    fb_col1, fb_col2 = st.columns(2)
	    with fb_col1:
	        if st.button("Yes, correct!", use_container_width=True, type="primary"):
	            spam_probability = r['proba'][1]
	            prediction = 1 if spam_probability >= threshold else 0
	            predicted_label = ("ham", "spam")[prediction]
	            # A confirmation logs the same label as both predicted and correct.
	            count = save_feedback(r['email_text'], predicted_label, predicted_label,
	                                  spam_probability, '', 'correct')
	            st.session_state['feedback_given'] = True
	            st.session_state['feedback_msg'] = (
	                "Feedback saved! Classified as %s confirmed correct. %d entries logged so far."
	                % (predicted_label.upper(), count)
	            )
	            st.rerun()
	    with fb_col2:
	        if st.button("No, it's wrong!", use_container_width=True):
	            # Nothing is saved yet: these flags hide the buttons and open
	            # the correction form on the next run.
	            st.session_state['feedback_wrong'] = True
	            st.session_state['feedback_given'] = True
	            st.rerun()

	# Correction form: shown once the verdict has been flagged as wrong and
	# until the correction has been saved.
	if st.session_state.get('feedback_wrong') and not st.session_state.get('feedback_saved'):
	    prediction = 1 if r['proba'][1] >= threshold else 0
	    predicted_label = "spam" if prediction == 1 else "ham"
	    # Only two classes exist, so the corrected label is the opposite one.
	    correct_label = "ham" if predicted_label == "spam" else "spam"
	    # A plain '|' separator: a backslash before the pipe is not a valid
	    # Python escape sequence, and the rendered Markdown is the same.
	    st.warning("Predicted: %s | Correct: %s" % (predicted_label.upper(), correct_label.upper()))
	    user_notes = st.text_input("Optional notes (e.g., 'Steam notification'):", key="feedback_notes")
	    if st.button("Save Correction", type="primary"):
	        count = save_feedback(r['email_text'], predicted_label, correct_label,
	                              r['proba'][1], user_notes, 'incorrect')
	        st.session_state['feedback_saved'] = True
	        st.session_state['feedback_msg'] = (
	            "Feedback saved! Predicted %s → Correct %s. %d entries logged so far."
	            % (predicted_label.upper(), correct_label.upper(), count))
	        st.rerun()

	# Confirmation banner: the message is kept in session state, so it is
	# still shown after the rerun triggered by saving.
	if st.session_state.get('feedback_msg'):
	    st.success(st.session_state['feedback_msg'])

	# Footer
	# A plain '|' separator: a backslash before the pipe is not a valid Python
	# escape sequence, and the rendered Markdown caption is the same.
	st.markdown("---")
	st.caption("ENGT 375 Project - Spam Classification with XAI | Random Forest + LIME + SHAP + ELI5 + Ollama LLM")