| """ | |
| Intelligent Audit Report Chatbot UI | |
| """ | |
| import os | |
| import warnings | |
| # Silence Streamlit deprecation warnings (use_column_width -> use_container_width) | |
| warnings.filterwarnings("ignore", message=".*use_column_width.*") | |
| warnings.filterwarnings("ignore", category=DeprecationWarning, module="streamlit") | |
| import time | |
| import json | |
| import uuid | |
| import logging | |
| import traceback | |
| from pathlib import Path | |
| from collections import Counter | |
| from typing import List, Dict, Any, Optional | |
| import pandas as pd | |
| import streamlit as st | |
| import plotly.express as px | |
| from langchain_core.messages import HumanMessage, AIMessage | |
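# Illustration of the cleanup above (assumed example values):
#   OMP_NUM_THREADS="3500m" -> "3500"; "8" -> "8"; "abc", "", or unset -> "1"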
# src.config.paths is lightweight and must load before the cache setup below
from src.config.paths import (
    IS_DEPLOYED,
    PROJECT_DIR,
    HF_CACHE_DIR,
    FEEDBACK_DIR,
    CONVERSATIONS_DIR,
)
# ===== Setup HuggingFace cache directories BEFORE any model imports =====
# CRITICAL: Set these before any imports that might use HuggingFace
# (like sentence-transformers). Only override cache directories in the
# deployed environment (local uses defaults).
if IS_DEPLOYED and HF_CACHE_DIR:
    cache_dir = str(HF_CACHE_DIR)
    os.environ["HF_HOME"] = cache_dir
    os.environ["TRANSFORMERS_CACHE"] = cache_dir
    os.environ["HF_DATASETS_CACHE"] = cache_dir
    os.environ["HF_HUB_CACHE"] = cache_dir
    os.environ["SENTENCE_TRANSFORMERS_HOME"] = cache_dir
    # Ensure the cache directory exists (created in the Dockerfile, but make sure)
    try:
        os.makedirs(cache_dir, mode=0o755, exist_ok=True)
    except (PermissionError, OSError):
        # If we can't create it, continue (it may already exist from the Dockerfile)
        pass
else:
    from dotenv import load_dotenv
    load_dotenv()

import time
import json
import uuid
import logging
import traceback
from pathlib import Path
from collections import Counter
from typing import List, Dict, Any, Optional

import pandas as pd
import streamlit as st
import plotly.express as px
from langchain_core.messages import HumanMessage, AIMessage

from src.agents import (
    get_multi_agent_chatbot,
    get_smart_chatbot,
    get_gemini_chatbot,
    get_visual_chatbot,
    get_visual_multi_agent_chatbot,
)
from src.feedback import FeedbackManager
from src.ui_components import (
    get_custom_css,
    display_chunk_statistics_charts,
    display_chunk_statistics_table,
    extract_chunk_statistics,
    display_visual_search_results,
)
# Configure logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)

# Informational environment logs (commented out to reduce noise)
# logger.info(f"📁 PROJECT_DIR: {PROJECT_DIR}")
# logger.info(f"🌍 Environment: {'DEPLOYED' if IS_DEPLOYED else 'LOCAL'}")
# logger.info(f"🔧 OMP_NUM_THREADS: {os.environ.get('OMP_NUM_THREADS', 'NOT SET')}")
# logger.info(f"📁 HuggingFace cache: {os.environ.get('HF_HOME', 'DEFAULT (not overridden)')}")
# Page config
st.set_page_config(
    layout="wide",
    page_icon="🔍",
    initial_sidebar_state="expanded",
    page_title="Kalimagezii - Audit Report Analysis"
)
# GPU check - only log once at startup
import torch
import sys

if "gpu_check" not in st.session_state:
    try:
        cuda_ = torch.cuda.is_available()
        mps_ = torch.backends.mps.is_available() if hasattr(torch.backends, 'mps') else False
        if cuda_:
            print(f"🎮 CUDA available: {torch.cuda.get_device_name(0)}")
        elif mps_:
            print("🍎 MPS (Apple Silicon) available")
        else:
            print("💻 CPU only (no GPU acceleration)")
    except Exception as e:
        print(f"⚠️ GPU check error: {e}", file=sys.stderr)
    finally:
        st.session_state.gpu_check = True

st.markdown(get_custom_css(), unsafe_allow_html=True)
def get_system_type():
    """Get the current system type"""
    system = os.environ.get('CHATBOT_SYSTEM', 'multi-agent')
    if system == 'smart':
        return "Smart Chatbot System"
    else:
        return "Multi-Agent System"
def get_chatbot(version: str = "v1"):
    """Initialize and return the chatbot for the given version"""
    if version == "beta":
        return get_gemini_chatbot()
    elif version == "visual":
        # Use the multi-agent architecture for visual mode (same sophisticated logic as v1)
        return get_visual_multi_agent_chatbot()
    else:
        # Check the environment variable for the system type (v1)
        system = os.environ.get('CHATBOT_SYSTEM', 'multi-agent')
        if system == 'smart':
            return get_smart_chatbot()
        else:
            return get_multi_agent_chatbot()
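# Version -> backend mapping implemented above:
#   "beta"   -> Gemini FSA chatbot
#   "visual" -> visual multi-agent chatbot (ColPali visual search)
#   "v1"     -> smart chatbot if CHATBOT_SYSTEM == "smart", else multi-agent chatbot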
def serialize_messages(messages):
    """Serialize LangChain messages to dictionaries"""
    serialized = []
    for msg in messages:
        if hasattr(msg, 'content'):
            serialized.append({
                "type": type(msg).__name__,
                "content": str(msg.content)
            })
    return serialized
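# Example (illustrative): serialize_messages([HumanMessage(content="Hi")])
#   -> [{"type": "HumanMessage", "content": "Hi"}]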
def serialize_documents(sources):
    """Serialize document objects to dictionaries with deduplication"""
    serialized = []
    seen_content = set()
    for doc in sources:
        content = getattr(doc, 'page_content', getattr(doc, 'content', ''))
        # Skip if we've seen this exact content before
        if content in seen_content:
            continue
        seen_content.add(content)
        metadata = getattr(doc, 'metadata', {})
        doc_dict = {
            "content": content,
            "metadata": metadata,
            "score": metadata.get('reranked_score', metadata.get('original_score', 0.0)),
            "id": metadata.get('_id', 'unknown'),
            "source": metadata.get('source', 'unknown'),
            "year": metadata.get('year', 'unknown'),
            "district": metadata.get('district', 'unknown'),
            "page": metadata.get('page', 'unknown'),
            "chunk_id": metadata.get('chunk_id', 'unknown'),
            "page_label": metadata.get('page_label', 'unknown'),
            "original_score": metadata.get('original_score', 0.0),
            "reranked_score": metadata.get('reranked_score', None)
        }
        serialized.append(doc_dict)
    return serialized
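# Example output entry (illustrative values): {"content": "...", "metadata": {...},
#   "score": 0.87, "source": "OAG", "year": "2022", ...}
# The top-level "score" prefers reranked_score, then original_score, else 0.0.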
feedback_manager = FeedbackManager()

def load_filter_options(version: str = "v1"):
    """
    Load filter options based on the selected version.
    For visual mode, only show filenames available in the visual collection.
    For v1/beta, show all filenames from the full collection.
    Note: Not cached, because visual mode needs fresh imports after code changes.
    """
    try:
        filter_options_path = PROJECT_DIR / "src" / "config" / "filter_options.json"
        with open(filter_options_path, "r") as f:
            base_options = json.load(f)
        if version == "visual":
            from src.config.visual_filename_mapping import get_visual_filter_options
            visual_options = get_visual_filter_options()
            return {
                'sources': visual_options.get('sources', ['Consolidated']),
                'years': visual_options.get('years', ['2018', '2019', '2020', '2021', '2022']),
                'districts': [],
                'filenames': visual_options.get('filenames', [])
            }
        return base_options
    except FileNotFoundError:
        st.info(f"Looking for filter_options.json in: {PROJECT_DIR / 'src' / 'config'}")
        st.error("filter_options.json not found. Please run the metadata analysis script.")
        return {"sources": [], "years": [], "districts": [], "filenames": []}
def main():
    # Initialize session state
    if 'messages' not in st.session_state:
        st.session_state.messages = []
    if 'conversation_id' not in st.session_state:
        st.session_state.conversation_id = f"session_{uuid.uuid4().hex[:8]}"
    if 'session_start_time' not in st.session_state:
        st.session_state.session_start_time = time.time()
    if 'active_filters' not in st.session_state:
        st.session_state.active_filters = {'sources': [], 'years': [], 'districts': [], 'filenames': []}
    # Initialize filter widget keys from active_filters (prevents default/session_state conflicts)
    if 'filenames_filter' not in st.session_state:
        st.session_state.filenames_filter = st.session_state.active_filters.get('filenames', [])
    # Track RAG retrieval history for feedback
    if 'rag_retrieval_history' not in st.session_state:
        st.session_state.rag_retrieval_history = []
    # Version selection (v1, beta, or visual)
    if 'chatbot_version' not in st.session_state:
        st.session_state.chatbot_version = "v1"

    # Initialize the chatbot for the current version (only if not already cached)
    chatbot_version_key = f"chatbot_{st.session_state.chatbot_version}"
    # Initialization is needed if the chatbot doesn't exist OR the version changed
    needs_init = (
        chatbot_version_key not in st.session_state or
        st.session_state.get('_last_version') != st.session_state.chatbot_version
    )
    if needs_init:
        try:
            # Different spinner messages for different versions
            if st.session_state.chatbot_version == "beta":
                spinner_msg = "🔄 Initializing Gemini FSA..."
            elif st.session_state.chatbot_version == "visual":
                spinner_msg = "🎨 Initializing Visual Search... This may take 20-30 seconds..."
            else:
                spinner_msg = "🔄 Loading AI models and connecting to database..."
            with st.spinner(spinner_msg):
                st.session_state[chatbot_version_key] = get_chatbot(st.session_state.chatbot_version)
            st.session_state['_last_version'] = st.session_state.chatbot_version
            st.session_state.chatbot = st.session_state[chatbot_version_key]
            print("✅ AI system ready!")
        except Exception as e:
            st.error(f"❌ Failed to initialize chatbot: {str(e)}")
            # Show version-specific error messages
            if st.session_state.chatbot_version == "beta":
                st.error("Please check your environment variables (GEMINI_API_KEY, GEMINI_FILESTORE_NAME for beta)")
            elif st.session_state.chatbot_version == "visual":
                st.error("Please check your environment variables (QDRANT_URL, QDRANT_API_KEY, OPENAI_API_KEY for visual)")
                with st.expander("🐛 Debug Info"):
                    st.code(traceback.format_exc())
            else:
                st.error("Please check your configuration and ensure all required models and databases are accessible.")
            # Reset to v1 to prevent an infinite init loop
            st.session_state.chatbot_version = "v1"
            st.session_state['_last_version'] = "v1"
            if 'chatbot' in st.session_state:
                del st.session_state['chatbot']
            st.stop()  # Stop execution to prevent an infinite loop
    else:
        # Chatbot already initialized for this version; just use it
        st.session_state.chatbot = st.session_state[chatbot_version_key]

    # Reset the conversation history if requested (but keep the chatbot cached)
    if 'reset_conversation' in st.session_state and st.session_state.reset_conversation:
        st.session_state.messages = []
        st.session_state.conversation_id = f"session_{uuid.uuid4().hex[:8]}"
        st.session_state.session_start_time = time.time()
        st.session_state.rag_retrieval_history = []
        st.session_state.feedback_submitted = False
        # Clear saliency-related state so nothing is recomputed after clearing
        st.session_state.last_rag_result = None
        st.session_state.show_saliency = False
        if 'saliency_cache' in st.session_state:
            st.session_state.saliency_cache = {}
        st.session_state.reset_conversation = False
        st.rerun()
    # Project title - centered at top
    st.markdown("""
    <div style="text-align: center; padding: 10px 0 20px 0;">
        <h1 style="
            font-family: 'Georgia', serif;
            font-size: 2.8rem;
            font-weight: 700;
            color: #1a1a2e;
            letter-spacing: 3px;
            margin: 0;
            text-shadow: 2px 2px 4px rgba(0,0,0,0.1);
        ">
            🔍 KALIMAGEZI
        </h1>
        <p style="
            font-family: 'Helvetica Neue', sans-serif;
            font-size: 1rem;
            color: #666;
            margin-top: 5px;
            letter-spacing: 1px;
        ">
            Intelligent Audit Report Analysis System
        </p>
    </div>
    """, unsafe_allow_html=True)
    # Version selection radio button (top right)
    col1, col2 = st.columns([3, 1])
    # with col1:
    #     st.markdown('<p class="subtitle">Ask questions about audit reports. Use the sidebar filters to narrow down your search!</p>', unsafe_allow_html=True)
    with col2:
        st.markdown("<br>", unsafe_allow_html=True)  # Add some spacing
        selected_version = st.radio(
            "**Version:**",
            options=["v1", "visual", "beta"],
            index=0 if st.session_state.chatbot_version == "v1" else (1 if st.session_state.chatbot_version == "visual" else 2),
            horizontal=True,
            key="version_selector",
            help="Select v1 (default RAG), visual (ColPali visual search), or beta (Gemini FSA)"
        )

    # Update the version if it changed
    if selected_version != st.session_state.chatbot_version:
        # Store the old version to check whether we need to switch
        old_version = st.session_state.chatbot_version
        st.session_state.chatbot_version = selected_version
        # If a chatbot for the new version already exists, just switch to it
        new_chatbot_key = f"chatbot_{selected_version}"
        if new_chatbot_key in st.session_state:
            st.session_state.chatbot = st.session_state[new_chatbot_key]
            st.session_state['_last_version'] = selected_version
        else:
            # The new version needs initialization - handled by the init logic above on rerun
            st.session_state['_last_version'] = old_version  # Set to old to trigger the init check
        st.rerun()
    # Show version info
    if st.session_state.chatbot_version == "beta":
        st.info("🔬 **Beta Mode**: Using Google Gemini FSA")
    elif st.session_state.chatbot_version == "visual":
        st.info("🎨 **Visual Mode**: Using Visual Search (Multi-Modal Embeddings)")

    # Session info
    duration = int(time.time() - st.session_state.session_start_time)
    duration_str = f"{duration // 60}m {duration % 60}s"
    st.markdown(f'''
    <div class="session-info">
        <strong>Session Info:</strong> Messages: {len(st.session_state.messages)} | Duration: {duration_str} | Status: Active | ID: {st.session_state.conversation_id}
    </div>
    ''', unsafe_allow_html=True)

    # Load filter options (version-specific for visual mode)
    filter_options = load_filter_options(st.session_state.chatbot_version)
    # Sidebar for filters
    with st.sidebar:
        # Instructions section (collapsible)
        with st.expander("📖 How to Use", expanded=True):
            st.markdown("""
            #### 🎯 Using Filters
            1. **Select filters** from the sidebar to narrow your search
            2. **Leave filters empty** to search across all data
            3. **Type your question** in the chat input at the bottom
            4. **Click "Send"** to submit your question

            #### 💡 Tips
            - Use specific questions for better results
            - Combine multiple filters for precise searches
            - Check the "Retrieved Documents" tab to see source material

            #### ⚠️ Important
            **When finished, please close the browser window** to free up computational resources.

            ---
            For more detailed help, see the example questions at the bottom of the page.
            """)
        # Check for pending filter updates (from example question buttons)
        pending_filenames = st.session_state.pop('_pending_filenames', None)
        if pending_filenames is not None:
            st.session_state.active_filters['filenames'] = pending_filenames
            st.session_state.filenames_filter = pending_filenames

        # Filters in a collapsed expander by default
        with st.expander("🔍 Search Filters", expanded=False):
            st.caption("Select filters to narrow down your search. Leave empty to search all data.")
            st.markdown('<div class="filter-section">', unsafe_allow_html=True)
            st.markdown('<div class="filter-title">📄 Specific Reports (Filename Filter)</div>', unsafe_allow_html=True)
            st.markdown('<p style="font-size: 0.85em; color: #666;">⚠️ Selecting specific reports will ignore all other filters</p>', unsafe_allow_html=True)
            selected_filenames = st.multiselect(
                "Select specific reports:",
                options=filter_options.get('filenames', []),
                key="filenames_filter",
                help="Choose specific reports to search. When enabled, all other filters are ignored."
            )
            st.markdown('</div>', unsafe_allow_html=True)
            # Determine whether the filename filter is active
            filename_mode = len(selected_filenames) > 0

            # Sources filter
            st.markdown('<div class="filter-title">📊 Sources</div>', unsafe_allow_html=True)
            selected_sources = st.multiselect(
                "Select sources:",
                options=filter_options['sources'],
                default=st.session_state.active_filters['sources'],
                disabled=filename_mode,
                key="sources_filter",
                help="Choose which types of reports to search"
            )
            st.markdown('</div>', unsafe_allow_html=True)

            # Years filter
            st.markdown('<div class="filter-title">📅 Years</div>', unsafe_allow_html=True)
            selected_years = st.multiselect(
                "Select years:",
                options=filter_options['years'],
                default=st.session_state.active_filters['years'],
                disabled=filename_mode,
                key="years_filter",
                help="Choose which years to search"
            )
            st.markdown('</div>', unsafe_allow_html=True)

            # Districts filter
            st.markdown('<div class="filter-title">🏘️ Districts</div>', unsafe_allow_html=True)
            selected_districts = st.multiselect(
                "Select districts:",
                options=filter_options['districts'],
                default=st.session_state.active_filters['districts'],
                disabled=filename_mode,
                key="districts_filter",
                help="Choose which districts to search"
            )
            st.markdown('</div>', unsafe_allow_html=True)
            # Clear filters button
            if st.button("🗑️ Clear All Filters", key="clear_filters_button"):
                st.session_state.active_filters = {'sources': [], 'years': [], 'districts': [], 'filenames': []}
                st.rerun()

        # Update active filters (outside the expander so it always runs)
        st.session_state.active_filters = {
            'sources': selected_sources if not filename_mode else [],
            'years': selected_years if not filename_mode else [],
            'districts': selected_districts if not filename_mode else [],
            'filenames': selected_filenames
        }
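        # Example (illustrative): with selected_filenames=["KCCA 2022"], the other
        # selections are dropped, yielding
        #   {'sources': [], 'years': [], 'districts': [], 'filenames': ['KCCA 2022']}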
        # Saliency settings (only for visual mode)
        if st.session_state.chatbot_version == "visual":
            with st.expander("🔥 Saliency Maps", expanded=False):
                st.caption("Visualize which image regions are relevant to your query")
                show_saliency = st.checkbox(
                    "Enable Saliency Maps",
                    value=st.session_state.get('show_saliency', False),
                    key="saliency_toggle",
                    help="Generate heatmaps showing which parts of each document are most relevant"
                )
                st.session_state.show_saliency = show_saliency

                if show_saliency:
                    # Saliency method selection
                    saliency_method = st.radio(
                        "Method",
                        options=["fast:spread", "slow:precise", "experimental"],
                        index={
                            "v3": 0,
                            "v2": 1,
                            "old": 2
                        }.get(st.session_state.get('saliency_method', 'v3'), 0),
                        key="saliency_method_radio",
                        horizontal=True,
                        help="fast:spread (V3), slow:precise (V2), experimental (tile-aware legacy)"
                    )
                    new_method = {
                        "fast:spread": "v3",
                        "slow:precise": "v2",
                        "experimental": "old"
                    }[saliency_method]
                    # Clear the saliency cache if the method changed
                    if st.session_state.get('saliency_method') != new_method:
                        st.session_state.saliency_cache = {}
                    st.session_state.saliency_method = new_method

                    # Expose the chosen method to the saliency module via environment variables
                    os.environ['SALIENCY_V3'] = '1' if st.session_state.saliency_method == 'v3' else '0'
                    os.environ['SALIENCY_V2'] = '1' if st.session_state.saliency_method == 'v2' else '0'
                    os.environ['SALIENCY_OLD'] = '1' if st.session_state.saliency_method == 'old' else '0'
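                    # Exactly one of SALIENCY_V3 / SALIENCY_V2 / SALIENCY_OLD is '1'
                    # at any time; the saliency module reads these flags at run time.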
                    # Advanced options (for debugging)
                    # Default storage order: tile (no UI toggle)
                    st.session_state.storage_order = 'tile'
                    os.environ['SALIENCY_STORAGE_ORDER'] = 'tile'

                    # Colormap selection (hot is the default)
                    colormap_options = ["hot", "jet", "viridis", "plasma", "coolwarm", "RdYlGn"]
                    saliency_colormap = st.selectbox(
                        "Colormap",
                        options=colormap_options,
                        index=colormap_options.index(st.session_state.get('saliency_colormap', 'hot')),
                        key="saliency_colormap_select",
                        help="Color scheme for the heatmap. 'hot' recommended for visibility."
                    )
                    st.session_state.saliency_colormap = saliency_colormap

                    saliency_alpha = st.slider(
                        "Overlay Transparency",
                        min_value=0.1,
                        max_value=0.8,
                        value=st.session_state.get('saliency_alpha', 0.4),
                        step=0.1,
                        key="saliency_alpha_slider",
                        help="0.1 = subtle, 0.8 = intense"
                    )
                    st.session_state.saliency_alpha = saliency_alpha

                    saliency_threshold = st.slider(
                        "Threshold (%)",
                        min_value=0,
                        max_value=80,
                        value=st.session_state.get('saliency_threshold', 50),
                        step=10,
                        key="saliency_threshold_slider",
                        help="Hide patches below this percentile"
                    )
                    st.session_state.saliency_threshold = saliency_threshold

                    st.markdown("---")
                    st.markdown("**🎯 Word-Level Saliency**")
                    st.caption("Select specific words to focus saliency on those words only")
                    # Get the last query text for word selection
                    def _clean_query_text(q: str) -> str:
                        if not q:
                            return ""
                        if "USER QUERY:" in q:
                            q = q.split("USER QUERY:", 1)[1]
                        return q.strip().strip('"').strip("'")
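                    # Example (illustrative):
                    #   _clean_query_text('FILTER CONTEXT:\nYears: 2022\n\nUSER QUERY:\n"budget for roads"')
                    #   -> 'budget for roads'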
| last_query = "" | |
| if hasattr(st.session_state, 'chatbot') and hasattr(st.session_state.chatbot, 'visual_search'): | |
| last_query = getattr(st.session_state.chatbot.visual_search, 'last_query_text', '') | |
| last_query = _clean_query_text(last_query) | |
| if last_query: | |
| try: | |
| from src.ui_components.word_selection import get_word_boundaries | |
| word_boundaries = get_word_boundaries(last_query) | |
| except ImportError: | |
| word_boundaries = [] | |
| st.caption("_Word selection unavailable_") | |
| if word_boundaries: | |
| st.markdown(f"**Query:** {last_query}") | |
| # Initialize selected words if not exists | |
| if 'selected_saliency_words' not in st.session_state: | |
| st.session_state.selected_saliency_words = [] | |
| # Create word selection checkboxes | |
| word_options = [word for _, _, word in word_boundaries] | |
| selected_words = st.multiselect( | |
| "Select words for saliency (leave empty for all words):", | |
| options=word_options, | |
| default=st.session_state.selected_saliency_words, | |
| key="saliency_word_selector", | |
| help="Only selected words will be used for saliency computation" | |
| ) | |
| st.session_state.selected_saliency_words = selected_words | |
| # Debug logging - show in UI what's selected | |
| if selected_words: | |
| st.caption(f"🎯 Selected: {', '.join(selected_words)}") | |
| logger.info(f"🔵 SIDEBAR: User selected words: {selected_words}") | |
| # Add refresh button to force saliency regeneration | |
| if st.button("🔄 Refresh Saliency", key="refresh_saliency"): | |
| st.session_state['force_saliency_refresh'] = True | |
| st.rerun() | |
| else: | |
| st.caption("_No words found in query_") | |
| else: | |
| st.caption("_Submit a query first to enable word selection_") | |
    # Main content area with tabs
    tab1, tab2 = st.tabs(["💬 Chat", "📄 Retrieved Documents"])

    with tab1:
        # Chat container
        chat_container = st.container()
        with chat_container:
            # Display the conversation history
            for message in st.session_state.messages:
                if isinstance(message, HumanMessage):
                    st.markdown(f'<div class="user-message">{message.content}</div>', unsafe_allow_html=True)
                elif isinstance(message, AIMessage):
                    st.markdown(f'<div class="bot-message">{message.content}</div>', unsafe_allow_html=True)
        # Input area
        st.markdown("<br>", unsafe_allow_html=True)
        # Two columns for the input and the button
        col1, col2 = st.columns([4, 1])
        with col1:
            # Use a counter to force input clearing
            if 'input_counter' not in st.session_state:
                st.session_state.input_counter = 0
            # Handle a pending question from the example questions section
            if 'pending_question' in st.session_state and st.session_state.pending_question:
                default_value = st.session_state.pending_question
                # Increment the counter to force a new input widget
                st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000
                del st.session_state.pending_question
            else:
                default_value = ""
            key_suffix = st.session_state.input_counter
            user_input = st.text_input(
                "Type your message here...",
                placeholder="Ask about budget allocations, expenditures, or audit findings...",
                key=f"user_input_{key_suffix}",
                label_visibility="collapsed",
                value=default_value
            )
        with col2:
            send_button = st.button("Send", key="send_button", use_container_width=True)

        # Clear chat button
        if st.button("🗑️ Clear Chat", key="clear_chat_button"):
            print("🗑️ Clear Chat clicked")
            logger.info("🗑️ Clear Chat clicked")
            st.session_state.reset_conversation = True
            # Clear all saved conversation files
            if CONVERSATIONS_DIR.exists():
                for file in CONVERSATIONS_DIR.iterdir():
                    if file.suffix == '.json':
                        file.unlink()
            st.rerun()
        # Handle user input
        if send_button and user_input:
            # Construct the filter context string
            filter_context_str = ""
            if selected_filenames:
                filter_context_str += "FILTER CONTEXT:\n"
                filter_context_str += f"Filenames: {', '.join(selected_filenames)}\n"
                filter_context_str += "\nUSER QUERY:\n"
            elif selected_sources or selected_years or selected_districts:
                filter_context_str += "FILTER CONTEXT:\n"
                if selected_sources:
                    filter_context_str += f"Sources: {', '.join(selected_sources)}\n"
                if selected_years:
                    filter_context_str += f"Years: {', '.join(selected_years)}\n"
                if selected_districts:
                    filter_context_str += f"Districts: {', '.join(selected_districts)}\n"
                filter_context_str += "\nUSER QUERY:\n"
            full_query = filter_context_str + user_input
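            # Resulting full_query layout (illustrative):
            #   FILTER CONTEXT:
            #   Years: 2022
            #
            #   USER QUERY:
            #   <the user's question>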
            # Add the user message to history
            st.session_state.messages.append(HumanMessage(content=user_input))

            # Get the chatbot response
            with st.spinner("🤔 Thinking..."):
                try:
                    # Pass the full query with filter context
                    chat_result = st.session_state.chatbot.chat(full_query, st.session_state.conversation_id)
                    # Handle both the old format (string) and the new format (dict)
                    if isinstance(chat_result, dict):
                        response = chat_result['response']
                        rag_result = chat_result.get('rag_result')
                        st.session_state.last_rag_result = rag_result
                        # Track this RAG retrieval for feedback
                        if rag_result:
                            sources = rag_result.get('sources', []) if isinstance(rag_result, dict) else (rag_result.sources if hasattr(rag_result, 'sources') else [])
                            # For Gemini, also check gemini_result for sources
                            if not sources:
                                gemini_result = chat_result.get('gemini_result')
                                print("🔍 DEBUG: Checking gemini_result for sources...")
                                print(f"    gemini_result exists: {gemini_result is not None}")
                                if gemini_result:
                                    print(f"    gemini_result type: {type(gemini_result)}")
                                    print(f"    has sources attr: {hasattr(gemini_result, 'sources')}")
                                    if hasattr(gemini_result, 'sources'):
                                        print(f"    sources length: {len(gemini_result.sources) if gemini_result.sources else 0}")
                                if gemini_result and hasattr(gemini_result, 'sources'):
                                    # Format Gemini sources for display
                                    if hasattr(st.session_state.chatbot, 'gemini_client'):
                                        sources = st.session_state.chatbot.gemini_client.format_sources_for_display(gemini_result)
                                        print(f"✅ Formatted {len(sources)} sources from gemini_client")
                                    elif hasattr(st.session_state.chatbot, '_format_gemini_sources'):
                                        sources = st.session_state.chatbot._format_gemini_sources(gemini_result)
                                        print(f"✅ Formatted {len(sources)} sources from _format_gemini_sources")
                                    # Update rag_result with the sources we found
                                    if sources:
                                        if isinstance(rag_result, dict):
                                            rag_result['sources'] = sources
                                        elif hasattr(rag_result, 'sources'):
                                            rag_result.sources = sources
                                        # Update last_rag_result with the sources
                                        st.session_state.last_rag_result = rag_result
                                        print(f"✅ Updated rag_result with {len(sources)} sources")
                            # Get the actual RAG query
                            actual_rag_query = chat_result.get('actual_rag_query', '')
                            if actual_rag_query:
                                # Format it like the log message
                                timestamp = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime())
                                formatted_query = f"{timestamp} - INFO - 🔍 ACTUAL RAG QUERY: '{actual_rag_query}'"
                            else:
                                formatted_query = "No RAG query available"
                            # Record the filters in effect for this retrieval
                            filters_used = {
                                "sources": st.session_state.active_filters.get('sources', []),
                                "years": st.session_state.active_filters.get('years', []),
                                "districts": st.session_state.active_filters.get('districts', []),
                                "filenames": st.session_state.active_filters.get('filenames', [])
                            }
                            retrieval_entry = {
                                "conversation_up_to": serialize_messages(st.session_state.messages),
                                "rag_query_expansion": formatted_query,
                                "docs_retrieved": serialize_documents(sources),
                                "filters_applied": filters_used,
                                "timestamp": time.time()
                            }
                            st.session_state.rag_retrieval_history.append(retrieval_entry)
                            # Debug logging
                            print(f"📊 RETRIEVAL TRACKING: {len(sources)} sources stored in retrieval history")
                    else:
                        response = chat_result
                        st.session_state.last_rag_result = None
                    # Add the bot response to history
                    st.session_state.messages.append(AIMessage(content=response))
                except Exception as e:
                    error_msg = f"Sorry, I encountered an error: {str(e)}"
                    st.session_state.messages.append(AIMessage(content=error_msg))

            # Clear the input and rerun
            st.session_state.input_counter += 1  # A new widget key clears the input
            st.rerun()
    with tab2:
        # Document retrieval panel
        if hasattr(st.session_state, 'last_rag_result') and st.session_state.last_rag_result:
            rag_result = st.session_state.last_rag_result
            # Handle both PipelineResult object and dictionary formats
            sources = None
            if hasattr(rag_result, 'sources'):
                # PipelineResult object format
                sources = rag_result.sources
            elif isinstance(rag_result, dict) and 'sources' in rag_result:
                # Dictionary format from the multi-agent system or visual search
                sources = rag_result['sources']
            # For Gemini, also check whether sources need formatting from gemini_result
            if not sources and isinstance(rag_result, dict):
                gemini_result = rag_result.get('gemini_result')
                if gemini_result and hasattr(gemini_result, 'sources'):
                    # Format Gemini sources for display
                    if hasattr(st.session_state.chatbot, 'gemini_client'):
                        sources = st.session_state.chatbot.gemini_client.format_sources_for_display(gemini_result)
                    elif hasattr(st.session_state.chatbot, '_format_gemini_sources'):
                        sources = st.session_state.chatbot._format_gemini_sources(gemini_result)
            # Check whether these are visual search results (visual metadata present)
            is_visual_search = False
            if sources:
                first_doc_metadata = getattr(sources[0], 'metadata', {})
                is_visual_search = 'num_tiles' in first_doc_metadata or 'num_visual_tokens' in first_doc_metadata

            if sources:
                # Use the visual display for visual search results
                if is_visual_search and st.session_state.chatbot_version == "visual":
                    st.markdown("### 🎨 Visual Search Results")
                    # Get saliency settings from session state
                    show_saliency = st.session_state.get('show_saliency', False)
                    saliency_alpha = st.session_state.get('saliency_alpha', 0.4)
                    saliency_threshold = st.session_state.get('saliency_threshold', 75)
                    saliency_colormap = st.session_state.get('saliency_colormap', 'hot')
                    selected_words = st.session_state.get('selected_saliency_words', [])

                    # Initialize everything the saliency path may touch up front
                    # (avoids UnboundLocalError when saliency is disabled or fails)
                    qdrant_client = None
                    collection_name = None
                    query_embedding = None
                    query_text = ""
                    selected_token_indices = None

                    # Always log the word-selection state for debugging
                    logger.info("🟢 SALIENCY PROCESSING START")
                    logger.info(f"    show_saliency={show_saliency}")
                    logger.info(f"    selected_words from session: {selected_words}")
                    if show_saliency:
                        try:
                            # Access the visual search adapter from the chatbot
                            chatbot = st.session_state.get('chatbot')
                            if chatbot and hasattr(chatbot, 'visual_search'):
                                visual_search = chatbot.visual_search
                                qdrant_client = visual_search.client
                                collection_name = visual_search.collection_name
                                query_embedding = visual_search.last_query_embedding
                                query_text = getattr(visual_search, 'last_query_text', '')
                                logger.info(f"    query_text: '{query_text[:50] if query_text else 'EMPTY'}'...")
                                logger.info(f"    query_embedding shape: {query_embedding.shape if hasattr(query_embedding, 'shape') else 'N/A'}")
                                if query_embedding is None:
                                    st.warning("⚠️ Query embedding not available for saliency")
                                    show_saliency = False
                                else:
                                    # Process the word selection
                                    logger.info(f"🔵 Processing word selection: selected_words={selected_words}")
                                    if selected_words and query_text:
                                        from src.ui_components.word_selection import get_token_indices_for_words, get_word_boundaries
                                        try:
                                            word_boundaries = get_word_boundaries(query_text)
                                            word_to_index = {word: idx for idx, (_, _, word) in enumerate(word_boundaries)}
                                            # Debug: log the word mapping
                                            logger.info("🔍 Word selection debug:")
                                            logger.info(f"    Query: '{query_text}'")
                                            logger.info(f"    Selected words: {selected_words}")
                                            logger.info(f"    Available words: {list(word_to_index.keys())}")
                                            selected_word_indices = [word_to_index[word] for word in selected_words if word in word_to_index]
                                            if not selected_word_indices:
                                                logger.warning(f"⚠️ No matching words found! Selected: {selected_words}, Available: {list(word_to_index.keys())}")
                                                selected_token_indices = None
                                            else:
                                                # Get input_ids and attention_mask for accurate mapping
                                                input_ids = getattr(visual_search, 'last_input_ids', None)
                                                attention_mask = getattr(visual_search, 'last_attention_mask', None)
                                                logger.info(f"    Word indices: {selected_word_indices}")
                                                logger.info(f"    Has input_ids: {input_ids is not None}, Has attention_mask: {attention_mask is not None}")
                                                selected_token_indices = get_token_indices_for_words(
                                                    visual_search.processor,
                                                    query_text,
                                                    selected_word_indices,
                                                    input_ids=input_ids,
                                                    attention_mask=attention_mask
                                                )
                                                if selected_token_indices:
                                                    logger.info(f"✅ Mapped to {len(selected_token_indices)} token indices")
                                                    logger.debug(f"    Token indices: {selected_token_indices[:20]}..." if len(selected_token_indices) > 20 else f"    Token indices: {selected_token_indices}")
                                                else:
                                                    logger.warning("⚠️ Token mapping returned an empty list")
                                                    selected_token_indices = None
                                        except Exception as e:
                                            logger.error(f"❌ Failed to get token indices for selected words: {e}")
                                            logger.debug(traceback.format_exc())
                                            selected_token_indices = None
                                    else:
                                        selected_token_indices = None
                                    logger.info(f"✅ Saliency enabled: colormap={saliency_colormap}, alpha={saliency_alpha}, threshold={saliency_threshold}, selected_words={len(selected_words) if selected_words else 'all'}")
                        except Exception as e:
                            logger.error(f"Failed to get saliency requirements: {e}")
                            st.warning(f"⚠️ Saliency unavailable: {str(e)[:50]}")
                            show_saliency = False
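                    # Note: a single selected word can map to several tokenizer tokens,
                    # so the mapping above yields token indices rather than word indices.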
                    # Extract statistics for the charts (same as v1)
                    stats = extract_chunk_statistics(sources)
                    # Show charts for visual RAG too (like v1)
                    if len(sources) >= 5:
                        display_chunk_statistics_charts(stats, "Retrieval Statistics")
                        st.markdown("---")
                    display_visual_search_results(
                        sources=sources,
                        show_statistics=True,
                        show_images=True,  # Show Cloudinary images
                        show_saliency=show_saliency,
                        qdrant_client=qdrant_client,
                        collection_name=collection_name,
                        query_embedding=query_embedding,
                        query_text=query_text,  # Pass the query text for V2 saliency
                        saliency_alpha=saliency_alpha,
                        saliency_colormap=saliency_colormap,  # Use the selected colormap
                        saliency_threshold=saliency_threshold,
                        selected_token_indices=selected_token_indices,
                        max_display=20
                    )
                else:
                    # Standard display for v1/beta results
                    # Count the unique filenames
                    unique_filenames = set()
                    for doc in sources:
                        filename = getattr(doc, 'metadata', {}).get('filename', 'Unknown')
                        unique_filenames.add(filename)
                    st.markdown(f"**Found {len(sources)} document chunks from {len(unique_filenames)} unique documents (showing top 20):**")
                    if len(unique_filenames) < len(sources):
                        st.info(f"💡 **Note**: Each document is split into multiple chunks. You're seeing {len(sources)} chunks from {len(unique_filenames)} documents.")

                    # Extract and display statistics
                    stats = extract_chunk_statistics(sources)
                    # Show charts for 10+ results, tables for fewer
                    if len(sources) >= 10:
                        display_chunk_statistics_charts(stats, "Retrieval Statistics")
                        # Also show the tables below the charts for a detailed view
                        st.markdown("---")
                        display_chunk_statistics_table(stats, "Retrieval Distribution")
                    else:
                        display_chunk_statistics_table(stats, "Retrieval Distribution")

                    st.markdown("---")
                    st.markdown("### 📄 Document Details")

                    # Compute the max score for normalization (display only)
                    all_scores = []
                    for doc in sources:
                        m = getattr(doc, 'metadata', {})
                        s = m.get('reranked_score') or m.get('original_score') or m.get('score')
                        if s is not None:
                            try:
                                all_scores.append(float(s))
                            except (ValueError, TypeError):
                                pass
                    max_score = max(all_scores) if all_scores else None
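                    # Example (illustrative): raw scores [0.84, 0.42] give max_score=0.84,
                    # so the second document displays as "Score: 50.0% relative | 0.420 raw".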
                    for i, doc in enumerate(sources):  # Show all documents
                        # Get the relevance score and ID if available
                        metadata = getattr(doc, 'metadata', {})
                        # Handle both standard RAG scores and Gemini scores
                        score = metadata.get('reranked_score') or metadata.get('original_score') or metadata.get('score')
                        chunk_id = metadata.get('_id') or metadata.get('chunk_id', 'Unknown')
                        if score is not None and max_score is not None and max_score > 0:
                            try:
                                raw_score = float(score)
                                relative_pct = (raw_score / max_score) * 100
                                score_text = f" (Score: {relative_pct:.1f}% relative | {raw_score:.3f} raw)"
                            except (ValueError, TypeError):
                                score_text = ""
                        elif score is not None:
                            try:
                                score_text = f" (Score: {float(score):.3f})"
                            except (ValueError, TypeError):
                                score_text = ""
                        else:
                            score_text = ""
                        if chunk_id and chunk_id != 'Unknown':
                            score_text += f" (ID: {str(chunk_id)[:8]}...)"

                        with st.expander(f"📄 Document {i+1}: {metadata.get('filename', 'Unknown')[:50]}...{score_text}"):
                            # Display document metadata with emojis
                            col1, col2, col3, col4 = st.columns([2, 1.5, 1, 1])
                            with col1:
                                st.write(f"📄 **File:** {metadata.get('filename', 'Unknown')}")
                            with col2:
                                st.write(f"🏛️ **Source:** {metadata.get('source', 'Unknown')}")
                            with col3:
                                st.write(f"📅 **Year:** {metadata.get('year', 'Unknown')}")
                            with col4:
                                # Display the page number and chunk ID
                                page = metadata.get('page_label', metadata.get('page', 'Unknown'))
                                chunk_id = metadata.get('_id', 'Unknown')
                                st.write(f"📖 **Page:** {page}")
                                st.write(f"🆔 **ID:** {chunk_id}")
                            # Display the full content (no truncation)
                            content = getattr(doc, 'page_content', 'No content available')
                            st.write("**Full Content:**")
                            st.text_area("Full Content", value=content, height=300, disabled=True, label_visibility="collapsed", key=f"preview_{i}")
            else:
                st.info("No documents were retrieved for the last query.")
        else:
            st.info("No documents have been retrieved yet. Start a conversation to see retrieved documents here.")
    # Feedback Dashboard Section
    st.markdown("---")
    st.markdown("### 💬 Feedback Dashboard")

    # Check whether there is any conversation to provide feedback on
    has_conversation = len(st.session_state.messages) > 0
    has_retrievals = len(st.session_state.rag_retrieval_history) > 0

    if not has_conversation:
        st.info("💡 Start a conversation to provide feedback!")
        st.markdown("The feedback dashboard will be enabled once you begin chatting.")
    else:
        st.markdown("Help us improve by providing feedback on this conversation.")
        # Initialize the feedback state if it doesn't exist
        if 'feedback_submitted' not in st.session_state:
            st.session_state.feedback_submitted = False

        # Feedback form - only shown if feedback has not already been submitted
        if not st.session_state.feedback_submitted:
            with st.form("feedback_form", clear_on_submit=False):
                col1, col2 = st.columns([1, 1])
                with col1:
                    feedback_score = st.slider(
                        "Rate this conversation (1-5)",
                        min_value=1,
                        max_value=5,
                        help="How satisfied are you with the conversation?"
                    )
                with col2:
                    is_feedback_about_last_retrieval = st.checkbox(
                        "Feedback about last retrieval only",
                        value=True,
                        help="If checked, feedback applies to the most recent document retrieval"
                    )
                open_ended_feedback = st.text_area(
                    "Your feedback (optional)",
                    placeholder="Tell us what went well or what could be improved...",
                    height=100
                )
                # Disable submit if no score is selected (defensive; the slider always returns a value)
                submit_disabled = feedback_score is None
                submitted = st.form_submit_button(
                    "📤 Submit Feedback",
                    use_container_width=True,
                    disabled=submit_disabled
                )
                if submitted:
                    # Log the feedback data being submitted
                    print("=" * 80)
                    print("🔄 FEEDBACK SUBMISSION: Starting...")
                    print("=" * 80)
                    st.write("🔍 **Debug: Feedback Data Being Submitted:**")

                    # Extract the transcript from the messages
                    transcript = feedback_manager.extract_transcript(st.session_state.messages)
                    # Build the retrievals structure
                    retrievals = feedback_manager.build_retrievals_structure(
                        st.session_state.rag_retrieval_history.copy() if st.session_state.rag_retrieval_history else [],
                        st.session_state.messages
                    )
                    # Build feedback_score_related_retrieval_docs
                    feedback_score_related_retrieval_docs = feedback_manager.build_feedback_score_related_retrieval_docs(
                        is_feedback_about_last_retrieval,
                        st.session_state.messages,
                        st.session_state.rag_retrieval_history.copy() if st.session_state.rag_retrieval_history else []
                    )
                    # Preserve the old retrieved_data format for backward compatibility
                    retrieved_data_old_format = st.session_state.rag_retrieval_history.copy() if st.session_state.rag_retrieval_history else []

                    # Create the feedback data dictionary
                    feedback_dict = {
                        "open_ended_feedback": open_ended_feedback,
                        "score": feedback_score,
                        "is_feedback_about_last_retrieval": is_feedback_about_last_retrieval,
                        "conversation_id": st.session_state.conversation_id,
                        "timestamp": time.time(),
                        "message_count": len(st.session_state.messages),
                        "has_retrievals": has_retrievals,
                        "retrieval_count": len(st.session_state.rag_retrieval_history) if st.session_state.rag_retrieval_history else 0,
                        "transcript": transcript,
                        "retrievals": retrievals,
                        "feedback_score_related_retrieval_docs": feedback_score_related_retrieval_docs,
                        "retrieved_data": retrieved_data_old_format  # Preserved old column
                    }
| print(f"📝 FEEDBACK SUBMISSION: Score={feedback_score}, Retrievals={len(st.session_state.rag_retrieval_history) if st.session_state.rag_retrieval_history else 0}") | |
| # Create UserFeedback dataclass instance | |
| feedback_obj = None # Initialize outside try block | |
| try: | |
| feedback_obj = feedback_manager.create_feedback_from_dict(feedback_dict) | |
| print(f"✅ FEEDBACK SUBMISSION: Feedback object created - ID={feedback_obj.feedback_id}") | |
| st.write(f"✅ **Feedback Object Created**") | |
| st.write(f"- Feedback ID: {feedback_obj.feedback_id}") | |
| st.write(f"- Score: {feedback_obj.score}/5") | |
| st.write(f"- Has Retrievals: {feedback_obj.has_retrievals}") | |
| # Convert back to dict for JSON serialization | |
| feedback_data = feedback_obj.to_dict() | |
| except Exception as e: | |
| print(f"❌ FEEDBACK SUBMISSION: Failed to create feedback object: {e}") | |
| st.error(f"Failed to create feedback object: {e}") | |
| feedback_data = feedback_dict | |
| # Display the data being submitted | |
| st.json(feedback_data) | |
                    # Save feedback to a file - use FEEDBACK_DIR (under PROJECT_DIR) to ensure writability
                    feedback_dir = FEEDBACK_DIR
                    try:
                        # Ensure the directory exists with write permissions (777 for compatibility)
                        feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
                    except (PermissionError, OSError) as e:
                        logger.warning(f"Could not create feedback directory at {feedback_dir}: {e}")
                        # Fall back to a relative path
                        feedback_dir = Path("feedback")
                        feedback_dir.mkdir(parents=True, mode=0o777, exist_ok=True)
                    feedback_file = feedback_dir / f"feedback_{st.session_state.conversation_id}_{int(time.time())}.json"
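                    # Resulting filename (illustrative): feedback_session_ab12cd34_1700000000.json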
                    try:
                        # Ensure the parent directory exists before writing
                        feedback_file.parent.mkdir(parents=True, mode=0o777, exist_ok=True)
                        # Save to the local file first
                        print(f"💾 FEEDBACK SAVE: Saving to local file: {feedback_file}")
                        with open(feedback_file, 'w') as f:
                            json.dump(feedback_data, f, indent=2, default=str)
                        print("✅ FEEDBACK SAVE: Local file saved successfully")

                        # Save to Snowflake if enabled and credentials are available
                        logger.info("🔄 FEEDBACK SAVE: Starting Snowflake save process...")
                        logger.info(f"📊 FEEDBACK SAVE: feedback_obj={'exists' if feedback_obj else 'None'}")
                        snowflake_success = False
                        try:
                            snowflake_enabled = os.getenv("SNOWFLAKE_ENABLED", "false").lower() == "true"
                            logger.info(f"🔍 SNOWFLAKE CHECK: enabled={snowflake_enabled}")
                            if snowflake_enabled:
                                if feedback_obj:
                                    try:
                                        logger.info("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")
                                        print("📤 SNOWFLAKE UI: Attempting to save feedback to Snowflake...")
                                        # Show a spinner while saving to Snowflake (can take 10-15 seconds:
                                        # connection establishment ~5s, data preparation, and SQL execution ~5s)
                                        with st.spinner("💾 Saving feedback to Snowflake... This may take 10-15 seconds (connecting to database, preparing data, and executing query)"):
                                            snowflake_success = feedback_manager.save_to_snowflake(feedback_obj)
                                        if snowflake_success:
                                            logger.info("✅ SNOWFLAKE UI: Successfully saved to Snowflake")
                                            print("✅ SNOWFLAKE UI: Successfully saved to Snowflake")
                                        else:
                                            logger.warning("⚠️ SNOWFLAKE UI: Save failed")
                                            print("⚠️ SNOWFLAKE UI: Save failed")
                                    except Exception as e:
                                        logger.error(f"❌ SNOWFLAKE UI ERROR: {e}")
                                        print(f"❌ SNOWFLAKE UI ERROR: {e}")
                                        traceback.print_exc()
                                        snowflake_success = False
                                else:
                                    logger.warning("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")
                                    print("⚠️ SNOWFLAKE UI: Skipping (feedback object not created)")
                                    snowflake_success = False
                            else:
                                logger.info("💡 SNOWFLAKE UI: Integration disabled")
                                print("💡 SNOWFLAKE UI: Integration disabled")
                                # If Snowflake is disabled, the local save alone counts as success
                                snowflake_success = True
                        except Exception as e:
                            logger.error(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")
                            print(f"❌ Exception in Snowflake save: {type(e).__name__}: {e}")
                            snowflake_success = False
                        # Only show success if the Snowflake save succeeded (or Snowflake is disabled)
                        if snowflake_success:
                            st.success("✅ Thank you for your feedback! It has been saved successfully.")
                            st.balloons()
                        else:
                            st.warning("⚠️ Feedback saved locally, but Snowflake save failed. Please check logs.")

                        # Mark feedback as submitted to prevent resubmission
                        st.session_state.feedback_submitted = True
                        print("=" * 80)
                        print("✅ FEEDBACK SUBMISSION: Completed successfully")
                        print("=" * 80)
                        # Show the file location
                        st.info(f"📁 Feedback saved to: {feedback_file}")
                    except Exception as e:
                        print(f"❌ FEEDBACK SUBMISSION: Error saving feedback: {e}")
                        print(f"❌ FEEDBACK SUBMISSION: Error type: {type(e).__name__}")
                        traceback.print_exc()
                        st.error(f"❌ Error saving feedback: {e}")
                        st.write(f"Debug error: {str(e)}")
        else:
            # Feedback already submitted - show a success message and a reset option
            st.success("✅ Feedback already submitted for this conversation!")
            col1, col2 = st.columns([1, 1])
            with col1:
                if st.button("🔄 Submit New Feedback", key="new_feedback_button", use_container_width=True):
                    try:
                        st.session_state.feedback_submitted = False
                        st.rerun()
                    except Exception as e:
                        # Handle any Streamlit API exceptions gracefully
                        logger.error(f"Error resetting feedback state: {e}")
                        st.error("Error resetting feedback. Please refresh the page.")
            with col2:
                if st.button("📋 View Conversation", key="view_conversation_button", use_container_width=True):
                    # Scrolling to the conversation is handled by the auto-scroll at the bottom
                    pass
    # Display retrieval history stats
    if st.session_state.rag_retrieval_history:
        st.markdown("---")
        st.markdown("#### 📊 Retrieval History")
        with st.expander(f"View {len(st.session_state.rag_retrieval_history)} retrieval entries", expanded=False):
            for idx, entry in enumerate(st.session_state.rag_retrieval_history, 1):
                st.markdown(f"### **Retrieval #{idx}**")
                # Display the timestamp if available
                if entry.get("timestamp"):
                    timestamp_str = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(entry["timestamp"]))
                    st.caption(f"🕐 {timestamp_str}")
                # Display the actual RAG query
                rag_query_expansion = entry.get("rag_query_expansion", "No query available")
                st.markdown("**🔍 RAG Query:**")
                st.code(rag_query_expansion, language="text")
                # Display the filters used
                filters_applied = entry.get("filters_applied", {})
                if filters_applied and any(filters_applied.values()):
                    st.markdown("**🎯 Filters Applied:**")
                    filter_display = {}
                    if filters_applied.get("sources"):
                        filter_display["Sources"] = filters_applied["sources"]
                    if filters_applied.get("years"):
                        filter_display["Years"] = filters_applied["years"]
                    if filters_applied.get("districts"):
                        filter_display["Districts"] = filters_applied["districts"]
                    if filters_applied.get("filenames"):
                        filter_display["Filenames"] = filters_applied["filenames"]
                    if filter_display:
                        st.json(filter_display)
                    else:
                        st.info("No filters applied")
                else:
                    st.info("No filters applied")
                # Display the conversation history up to the retrieval point
                conversation_up_to = entry.get("conversation_up_to", [])
                if conversation_up_to:
                    st.markdown("**💬 Conversation History (up to retrieval point):**")
                    with st.expander(f"View {len(conversation_up_to)} messages", expanded=False):
                        for msg_idx, msg in enumerate(conversation_up_to, 1):
                            role = msg.get("type", "unknown")
                            content = msg.get("content", "")
                            if role in ("HumanMessage", "human"):
                                st.markdown(f"**👤 User {msg_idx}:** {content[:200]}{'...' if len(content) > 200 else ''}")
                            elif role in ("AIMessage", "ai"):
                                st.markdown(f"**🤖 Assistant {msg_idx}:** {content[:200]}{'...' if len(content) > 200 else ''}")
                else:
                    st.info("No conversation history available")
                # Display the documents retrieved
                docs_retrieved = entry.get("docs_retrieved", [])
                if docs_retrieved:
                    st.markdown(f"**📄 Documents Retrieved ({len(docs_retrieved)}):**")
                    # Compute the max score for normalization. serialize_documents stores
                    # the score at the top level of each doc dict, so look there first.
                    doc_scores = [d.get("score", d.get("metadata", {}).get("score")) for d in docs_retrieved]
                    doc_scores = [s for s in doc_scores if s is not None]
                    doc_max_score = max(float(s) for s in doc_scores) if doc_scores else None
                    with st.expander(f"View {len(docs_retrieved)} documents", expanded=False):
                        for doc_idx, doc in enumerate(docs_retrieved, 1):
                            st.markdown(f"**Document {doc_idx}:**")
                            # Display metadata
                            metadata = doc.get("metadata", {})
                            if metadata:
                                col1, col2, col3 = st.columns(3)
                                with col1:
                                    st.write(f"📄 **File:** {metadata.get('filename', 'Unknown')}")
                                with col2:
                                    st.write(f"🏛️ **Source:** {metadata.get('source', 'Unknown')}")
                                with col3:
                                    st.write(f"📅 **Year:** {metadata.get('year', 'Unknown')}")
                                # Additional metadata
                                if metadata.get('district'):
                                    st.write(f"📍 **District:** {metadata.get('district')}")
                                if metadata.get('page'):
                                    st.write(f"📖 **Page:** {metadata.get('page')}")
                                doc_score = doc.get("score", metadata.get("score"))
                                if doc_score is not None and doc_max_score is not None and doc_max_score > 0:
                                    try:
                                        pct = (float(doc_score) / doc_max_score) * 100
                                        st.write(f"⭐ **Score:** {pct:.1f}%")
                                    except (ValueError, TypeError):
                                        st.write(f"⭐ **Score:** {doc_score}")
                            # Display a content preview (first 200 chars)
                            content = doc.get("content", doc.get("page_content", ""))
                            if content:
                                st.markdown("**Content Preview:**")
                                st.text_area(
                                    "Content Preview",
                                    value=content[:200] + ("..." if len(content) > 200 else ""),
                                    height=100,
                                    disabled=True,
                                    label_visibility="collapsed",
                                    key=f"retrieval_{idx}_doc_{doc_idx}_preview"
                                )
                            if doc_idx < len(docs_retrieved):
                                st.markdown("---")
                else:
                    st.info("No documents retrieved")

                # Display summary stats
                st.markdown("**📊 Summary:**")
                st.json({
                    "conversation_length": len(conversation_up_to),
                    "documents_retrieved": len(docs_retrieved)
                })
                if idx < len(st.session_state.rag_retrieval_history):
                    st.markdown("---")
| # Example Questions Section - Single horizontal row layout | |
| st.markdown("---") | |
| # Strategy-specific example questions | |
| is_visual_mode = st.session_state.chatbot_version == "visual" | |
| # Visual RAG questions with associated filters | |
| visual_q1 = "Budget amount for the Staff Costs for KCCA under Parish Developement" | |
| visual_q1_hint = "💡 <b>Hint:</b> select <b>KCCA 2022</b> in the sidebar" | |
| visual_q1_filters = ["KCCA 2022"] | |
| visual_q2 = "The impact of the COVID-19 on the finances" | |
| visual_q2_hint = "💡 <b>Hint:</b> select <b>Annual Consolidated OAG 2019/2020/2021</b> in the sidebar" | |
| visual_q2_filters = ["Annual Consolidated OAG 2019", "Annual Consolidated OAG 2020", "Annual Consolidated OAG 2021"] | |
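| # NOTE: these labels are assumed to match the sidebar's filename options | |
| # exactly; the "Use Question" handlers below stash them in | |
| # st.session_state._pending_filenames so the sidebar (defined earlier in | |
| # the file) can pre-select them on the next rerun. | |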
| # Text RAG questions (v1) | |
| text_q1 = "How were administrative costs managed in the PDM implementation, and what issues arose with budget execution regarding staff salaries?" | |
| text_q1_hint = "🔄 This question will trigger follow-up prompts for <b>year/district</b>" | |
| text_q2 = "What did the National Coordinator say about the release of funds for PDM administrative costs in the letter dated 29th September 2022 and how did the funding received affect the activities of the PDCs and PDM SACCOs in the FY 2022/23?" | |
| text_q2_hint = "✅ Complete question - has <b>year & context</b>, no follow-up needed" | |
| # Select questions based on mode | |
| default_q1 = visual_q1 if is_visual_mode else text_q1 | |
| default_q1_hint = visual_q1_hint if is_visual_mode else text_q1_hint | |
| default_q2 = visual_q2 if is_visual_mode else text_q2 | |
| default_q2_hint = visual_q2_hint if is_visual_mode else text_q2_hint | |
| # Reset example questions when mode changes | |
| last_example_mode = st.session_state.get('_last_example_mode', None) | |
| current_mode = 'visual' if is_visual_mode else 'text' | |
| if last_example_mode != current_mode and last_example_mode is not None: | |
| # Force widget keys to new values directly (more reliable than deleting) | |
| st.session_state.edit_question_2 = default_q1 | |
| st.session_state.edit_question_3 = default_q2 | |
| st.session_state.custom_question_1 = default_q1 | |
| st.session_state.custom_question_2 = default_q2 | |
| st.session_state._last_example_mode = current_mode | |
| elif last_example_mode is None: | |
| st.session_state._last_example_mode = current_mode | |
| st.session_state.edit_question_2 = default_q1 | |
| st.session_state.edit_question_3 = default_q2 | |
| st.session_state.custom_question_1 = default_q1 | |
| st.session_state.custom_question_2 = default_q2 | |
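| # NOTE: writing to a widget's session_state key is only legal before the | |
| # widget is instantiated in the current run (Streamlit raises a | |
| # StreamlitAPIException otherwise), which is why the defaults are forced | |
| # here, ahead of the text_areas below. | |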
| # Determine if expander should be expanded (only when chat is empty) | |
| chat_is_empty = len(st.session_state.get('messages', [])) == 0 | |
| # Expandable Example Questions section | |
| with st.expander("💡 Example Questions", expanded=chat_is_empty): | |
| # Label row - "Customizable Questions" centered above Q2 and Q3 area | |
| label_col1, label_col2, label_col3 = st.columns([3, 11, 1]) | |
| with label_col2: | |
| st.markdown(""" | |
| <div style=" | |
| text-align: center; | |
| margin-top: 5px; | |
| margin-bottom: 10px; | |
| "> | |
| <h3 style=" | |
| color: #666; | |
| margin: 0; | |
| font-size: 1.1em; | |
| font-weight: 600; | |
| ">✏️ Customizable Questions</h3> | |
| </div> | |
| """, unsafe_allow_html=True) | |
| st.write("") | |
| # Layout: Q1 (left) | Q2 & Q3 (right) - all at same horizontal level | |
| q1_col, q23_col = st.columns([1.5, 5.5]) | |
| # Column 1: Question 1 (File Insights) - Non-editable, reduced width | |
| with q1_col: | |
| example_q1 = "List a couple of insights from the filename." | |
| st.markdown("**📄 File Insights** _(select a file first)_") | |
| st.code(example_q1, language=None) | |
| if st.button("📋 Use question !", key="use_example_1", use_container_width=True): | |
| st.session_state.pending_question = example_q1 | |
| st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000 | |
| st.rerun() | |
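| # NOTE (assumed wiring): pending_question is consumed by the chat input | |
| # section earlier in the file, and bumping input_counter presumably | |
| # rotates the input widget's key so the new text takes effect on rerun. | |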
| # Column 2: Questions 2 & 3 side by side | |
| with q23_col: | |
| q2_col, q3_col = st.columns(2) | |
| # Question 2 | |
| with q2_col: | |
| # Display hint with proper HTML formatting | |
| if is_visual_mode: | |
| st.markdown(f"<div style='color: #1f77b4; font-weight: 600; margin-bottom: 5px;'>{default_q1_hint}</div>", unsafe_allow_html=True) | |
| else: | |
| st.markdown(f"<div style='margin-bottom: 5px;'>{default_q1_hint}</div>", unsafe_allow_html=True) | |
| custom_q1 = st.text_area( | |
| "Question 2:", | |
| height=100, | |
| key="edit_question_2", | |
| help="Modify this question to fit your needs" | |
| ) | |
| if st.button("📋 Use Question 2", key="use_custom_1", use_container_width=True): | |
| if custom_q1.strip(): | |
| st.session_state.pending_question = custom_q1.strip() | |
| st.session_state.custom_question_1 = custom_q1.strip() | |
| st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000 | |
| # Auto-select filters for visual mode (use pending to avoid widget error) | |
| if is_visual_mode: | |
| st.session_state._pending_filenames = visual_q1_filters | |
| st.rerun() | |
| else: | |
| st.warning("Please enter a question first!") | |
| # Question 3 | |
| with q3_col: | |
| # Display hint with proper HTML formatting | |
| if is_visual_mode: | |
| st.markdown(f"<div style='color: #1f77b4; font-weight: 600; margin-bottom: 5px;'>{default_q2_hint}</div>", unsafe_allow_html=True) | |
| else: | |
| st.markdown(f"<div style='margin-bottom: 5px;'>{default_q2_hint}</div>", unsafe_allow_html=True) | |
| custom_q2 = st.text_area( | |
| "Question 3:", | |
| height=100, | |
| key="edit_question_3", | |
| help="Modify this question to fit your needs" | |
| ) | |
| if st.button("📋 Use Question 3", key="use_custom_2", use_container_width=True): | |
| if custom_q2.strip(): | |
| st.session_state.pending_question = custom_q2.strip() | |
| st.session_state.custom_question_2 = custom_q2.strip() | |
| st.session_state.input_counter = (st.session_state.get('input_counter', 0) + 1) % 1000 | |
| # Auto-select filters for visual mode (use pending to avoid widget error) | |
| if is_visual_mode: | |
| st.session_state._pending_filenames = visual_q2_filters | |
| st.rerun() | |
| else: | |
| st.warning("Please enter a question first!") | |
| # Store selected question for next render (handled in input section above) | |
| # This ensures the question populates the input field correctly | |
| # Auto-scroll to bottom | |
| # NOTE: browsers do not execute <script> tags injected via innerHTML, so a | |
| # script embedded in st.markdown is generally ignored; this is best-effort. | |
| st.markdown(""" | |
| <script> | |
| window.scrollTo(0, document.body.scrollHeight); | |
| </script> | |
| """, unsafe_allow_html=True) | |
| if __name__ == "__main__": | |
| # Guard against `python app.py`: the app only works under `streamlit run` | |
| def _exit_with_usage_warning(): | |
| """Print usage instructions and exit (shared by both failure paths).""" | |
| import sys | |
| print("=" * 80) | |
| print("⚠️ WARNING: This is a Streamlit app!") | |
| print("=" * 80) | |
| print("\nPlease run this app using:") | |
| print("  streamlit run app.py") | |
| print("\nNot: python app.py") | |
| print("\nThe app will not function correctly when run with 'python app.py'") | |
| print("=" * 80) | |
| sys.exit(1) | |
| try: | |
| from streamlit.runtime.scriptrunner import get_script_run_ctx | |
| if get_script_run_ctx() is None: | |
| # Not in the Streamlit runtime - warn and exit | |
| _exit_with_usage_warning() | |
| except ImportError: | |
| # Streamlit (or this internal module path) is not importable | |
| _exit_with_usage_warning() | |
| main() | |