Spaces:

cdpearlman
/

LLMVis

Running

App Files Files Community

LLMVis / app.py

cdpearlman

Fixed chatbot bubble generation bug

d075209 3 days ago

raw

history blame contribute delete

63.1 kB

	"""
	Transformer Explanation Dashboard

	A dashboard focused on explaining how transformer models process input and arrive at predictions.
	Uses a linear pipeline visualization with expandable stages.
	"""

	# Disable TensorFlow before any imports (fixes transformers/TF version incompatibility)
	import os
	os.environ["USE_TF"] = "0"

	from dotenv import load_dotenv
	load_dotenv() # Load environment variables from .env file

	import dash
	from dash import html, dcc, Input, Output, State, callback, no_update, ALL, MATCH
	import json
	import torch
	from utils import (load_model_and_get_patterns, execute_forward_pass, extract_layer_data,
	perform_beam_search, execute_forward_pass_with_multi_layer_head_ablation)
	from utils.head_detection import get_active_head_summary
	from utils.model_config import get_auto_selections
	from utils.token_attribution import compute_integrated_gradients, compute_simple_gradient_attribution

	# Import modular components
	from components.sidebar import create_sidebar
	from components.model_selector import create_model_selector
	from components.glossary import create_glossary_modal
	from components.pipeline import (create_pipeline_container, create_tokenization_content,
	create_embedding_content, create_attention_content,
	create_mlp_content, create_output_content,
	_build_token_display, _build_top5_chart)
	from components.investigation_panel import create_investigation_panel, create_attribution_results_display
	from components.ablation_panel import create_selected_heads_display, create_ablation_results_display
	from components.chatbot import create_chatbot_container, render_messages

	# Initialize Dash app
	app = dash.Dash(
	__name__,
	suppress_callback_exceptions=True,
	external_stylesheets=[
	"https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.0.0/css/all.min.css"
	]
	)
	app.title = "Transformer Explanation Dashboard"


	# ============================================================================
	# APP LAYOUT
	# ============================================================================

	app.layout = html.Div([
	# Glossary Modal
	create_glossary_modal(),

	# Session storage
	dcc.Store(id='session-activation-store', storage_type='memory'),
	dcc.Store(id='session-patterns-store', storage_type='session'),
	dcc.Store(id='session-activation-store-original', storage_type='memory'),
	dcc.Store(id='sidebar-collapse-store', storage_type='session', data=True),
	dcc.Store(id='generation-results-store', storage_type='session'),
	dcc.Store(id='investigation-active-tab', storage_type='session', data='ablation'),
	dcc.Store(id='ablation-selected-heads', storage_type='session', data=[]),
	# Agent F: Stores for separating original prompt analysis from beam generation
	dcc.Store(id='session-original-prompt-store', storage_type='memory'), # Original user prompt
	dcc.Store(id='session-selected-beam-store', storage_type='memory'), # Selected beam for comparison

	# Main container
	html.Div([
	# Header
	html.Div([
	html.H1("Transformer Explanation Dashboard", className="header-title"),
	html.P("Understand how transformer models process text and make predictions",
	className="header-subtitle")
	], className="header"),

	# Main content area
	html.Div([
	# Left sidebar
	html.Div([
	create_sidebar()
	], id="sidebar-container", className="sidebar collapsed"),

	# Right main panel
	html.Div([
	# Generator Interface
	html.Div([
	html.H3("Input", className="section-title"),
	create_model_selector(),

	# Generation Settings
	html.Div([
	html.H4("Generation Settings", style={'fontSize': '14px', 'marginTop': '15px', 'marginBottom': '10px'}),

	html.Div([
	html.Div([
	html.Label("Number of New Tokens:", className="input-label"),
	dcc.Slider(
	id='max-new-tokens-slider',
	min=1, max=20, step=1, value=1,
	marks={1: '1', 5: '5', 10: '10', 20: '20'},
	tooltip={"placement": "bottom", "always_visible": True}
	)
	], style={'flex': '1', 'marginRight': '20px'}),

	html.Div([
	html.Label("Options to Generate:", className="input-label"),
	dcc.Slider(
	id='beam-width-slider',
	min=1, max=5, step=1, value=1,
	marks={1: '1', 3: '3', 5: '5'},
	tooltip={"placement": "bottom", "always_visible": True}
	),
	html.P("Generate multiple possible completions to compare",
	style={'color': '#6c757d', 'fontSize': '11px', 'marginTop': '4px', 'marginBottom': '0'})
	], style={'flex': '1'})
	], style={'display': 'flex', 'marginBottom': '20px'}),

	html.Button(
	[html.I(className="fas fa-play", style={'marginRight': '8px'}), "Analyze"],
	id="generate-btn",
	className="action-button primary-button",
	disabled=True,
	style={'width': '100%', 'padding': '12px', 'fontSize': '16px'}
	)
	], style={'padding': '15px', 'backgroundColor': '#f8f9fa', 'borderRadius': '8px', 'marginTop': '15px'})

	], className="config-section"),

	# Results List (for beam search)
	dcc.Loading(
	id="generation-loading",
	type="default",
	children=html.Div(id="generation-results-container", style={'marginTop': '20px'}),
	color='#667eea'
	),

	# Pipeline Visualization
	dcc.Loading(
	id="pipeline-loading",
	type="default",
	children=html.Div([
	html.Hr(style={'margin': '30px 0', 'borderTop': '1px solid #dee2e6'}),
	create_pipeline_container()
	], id="pipeline-section"),
	color='#667eea',
	style={'minHeight': '100px'}
	),

	# Investigation Panel
	dcc.Loading(
	id="investigation-loading",
	type="default",
	children=html.Div([
	html.Hr(style={'margin': '30px 0', 'borderTop': '1px solid #dee2e6'}),
	create_investigation_panel()
	], id="investigation-section"),
	color='#667eea',
	style={'minHeight': '100px'}
	)

	], className="main-panel")
	], className="content-container")
	], className="app-container"),

	# AI Chatbot
	create_chatbot_container()
	], className="app-wrapper")


	# ============================================================================
	# CALLBACKS: Glossary
	# ============================================================================

	@app.callback(
	[Output("glossary-overlay-bg", "className"),
	Output("glossary-drawer-content", "className")],
	[Input("open-glossary-btn", "n_clicks"),
	Input("close-glossary-btn", "n_clicks"),
	Input("glossary-overlay-bg", "n_clicks")],
	prevent_initial_call=True
	)
	def toggle_glossary(open_clicks, close_clicks, overlay_clicks):
	ctx = dash.callback_context
	if not ctx.triggered:
	return no_update, no_update
	trigger_id = ctx.triggered[0]["prop_id"].split(".")[0]
	if trigger_id == "open-glossary-btn":
	return "glossary-overlay open", "glossary-drawer open"
	else:
	return "glossary-overlay", "glossary-drawer"


	# ============================================================================
	# CALLBACKS: Model Loading
	# ============================================================================

	@app.callback(
	[Output('session-patterns-store', 'data'),
	Output('attention-modules-dropdown', 'options'),
	Output('block-modules-dropdown', 'options'),
	Output('norm-params-dropdown', 'options'),
	Output('attention-modules-dropdown', 'value', allow_duplicate=True),
	Output('block-modules-dropdown', 'value', allow_duplicate=True),
	Output('norm-params-dropdown', 'value', allow_duplicate=True),
	Output('loading-indicator', 'children'),
	# Clear all stale stores when model changes
	Output('session-activation-store', 'data', allow_duplicate=True),
	Output('session-activation-store-original', 'data', allow_duplicate=True),
	Output('generation-results-store', 'data', allow_duplicate=True),
	Output('generation-results-container', 'children', allow_duplicate=True),
	Output('session-original-prompt-store', 'data', allow_duplicate=True),
	Output('session-selected-beam-store', 'data', allow_duplicate=True),
	Output('ablation-selected-heads', 'data', allow_duplicate=True),
	Output('pipeline-container', 'style', allow_duplicate=True),
	Output('investigation-panel', 'style', allow_duplicate=True)],
	[Input('model-dropdown', 'value')],
	prevent_initial_call=True
	)
	def load_model_patterns(selected_model):
	"""Load and categorize model patterns when a model is selected."""
	# 9 new cleared outputs: activation, activation-original, gen-results-store,
	# gen-results-container, original-prompt, selected-beam, ablation-heads,
	# pipeline style, investigation style
	cleared_stores = ({}, {}, None, [], {}, {}, [], {'display': 'none'}, {'display': 'none'})
	if not selected_model:
	return ({}, [], [], [], None, None, None, None) + cleared_stores

	try:
	module_patterns, param_patterns = load_model_and_get_patterns(selected_model)

	def create_grouped_options(patterns_dict, filter_keywords, option_type):
	filtered_options = []
	other_options = []
	for pattern, items in patterns_dict.items():
	pattern_lower = pattern.lower()
	option = {'label': pattern, 'value': pattern, 'title': f"{len(items)} {option_type} matching this pattern"}
	if any(keyword in pattern_lower for keyword in filter_keywords):
	filtered_options.append(option)
	else:
	other_options.append(option)
	result = []
	if filtered_options:
	result.extend(filtered_options)
	if other_options:
	result.append({'label': '─── Other Options ───', 'value': '_separator_', 'disabled': True})
	result.extend(other_options)
	else:
	result.extend(other_options)
	return result

	attention_options = create_grouped_options(module_patterns, ['attn', 'attention'], 'modules')
	block_options = create_grouped_options(module_patterns, ['layers', 'h.', 'blocks', 'decoder.layers'], 'modules')
	norm_options = create_grouped_options(param_patterns, ['norm', 'layernorm', 'layer_norm'], 'params')

	auto_selections = get_auto_selections(selected_model, module_patterns, param_patterns)

	patterns_data = {
	'module_patterns': module_patterns,
	'param_patterns': param_patterns,
	'selected_model': selected_model,
	'family': auto_selections.get('family_name'),
	'family_description': auto_selections.get('family_description', '')
	}

	family_name = auto_selections.get('family_name')
	if family_name:
	loading_content = html.Div([
	html.I(className="fas fa-check-circle", style={'color': '#28a745', 'marginRight': '8px'}),
	html.Div([
	html.Div("Model loaded successfully!"),
	html.Div(f"Detected family: {auto_selections.get('family_description', family_name)}",
	style={'fontSize': '12px', 'color': '#6c757d', 'marginTop': '4px'})
	])
	], className="status-success")
	else:
	loading_content = html.Div([
	html.I(className="fas fa-check-circle", style={'color': '#28a745', 'marginRight': '8px'}),
	"Model loaded - manual selection required"
	], className="status-success")

	return (patterns_data, attention_options, block_options, norm_options,
	auto_selections.get('attention_selection', []),
	auto_selections.get('block_selection', []),
	auto_selections.get('norm_selection', []),
	loading_content) + cleared_stores

	except Exception as e:
	print(f"Error loading model patterns: {e}")
	error_content = html.Div([
	html.I(className="fas fa-exclamation-triangle", style={'color': '#dc3545', 'marginRight': '8px'}),
	f"Error loading model: {str(e)}"
	], className="status-error")
	return ({}, [], [], [], None, None, None, error_content) + cleared_stores


	@app.callback(
	Output('loading-indicator', 'children', allow_duplicate=True),
	[Input('model-dropdown', 'value')],
	prevent_initial_call=True
	)
	def show_loading_spinner(selected_model):
	if not selected_model:
	return None
	return html.Div([
	html.I(className="fas fa-spinner fa-spin", style={'marginRight': '8px'}),
	"Loading model..."
	], className="status-loading")


	@app.callback(
	[Output('attention-modules-dropdown', 'value'),
	Output('block-modules-dropdown', 'value'),
	Output('norm-params-dropdown', 'value'),
	Output('session-activation-store', 'data', allow_duplicate=True),
	Output('loading-indicator', 'children', allow_duplicate=True)],
	[Input('clear-selections-btn', 'n_clicks')],
	prevent_initial_call=True
	)
	def clear_all_selections(n_clicks):
	if not n_clicks:
	return no_update
	cleared_status = html.Div([
	html.I(className="fas fa-broom", style={'color': '#6c757d', 'marginRight': '8px'}),
	"All selections cleared"
	], className="status-cleared")
	return None, None, None, {}, cleared_status


	@app.callback(
	Output('generate-btn', 'disabled'),
	[Input('model-dropdown', 'value'),
	Input('prompt-input', 'value'),
	Input('block-modules-dropdown', 'value'),
	Input('norm-params-dropdown', 'value')]
	)
	def enable_run_button(model, prompt, block_modules, norm_params):
	return not (model and prompt and block_modules and norm_params)


	# ============================================================================
	# CALLBACKS: Generation & Analysis
	# ============================================================================

	@app.callback(
	[Output('generation-results-container', 'children'),
	Output('generation-results-store', 'data'),
	Output('pipeline-container', 'style'),
	Output('investigation-panel', 'style'),
	Output('session-activation-store', 'data', allow_duplicate=True),
	Output('session-activation-store-original', 'data', allow_duplicate=True),
	Output('session-original-prompt-store', 'data'),
	Output('session-selected-beam-store', 'data')],
	[Input('generate-btn', 'n_clicks')],
	[State('model-dropdown', 'value'),
	State('prompt-input', 'value'),
	State('max-new-tokens-slider', 'value'),
	State('beam-width-slider', 'value'),
	State('session-patterns-store', 'data'),
	State('attention-modules-dropdown', 'value'),
	State('block-modules-dropdown', 'value'),
	State('norm-params-dropdown', 'value')],
	prevent_initial_call=True
	)
	def run_generation(n_clicks, model_name, prompt, max_new_tokens, beam_width, patterns_data, attn_patterns, block_patterns, norm_patterns):
	"""
	Run generation and analysis.

	Agent F refactor: Pipeline analysis (tokenization, embedding, attention, MLP, output)
	always runs on the ORIGINAL PROMPT only. Beam generation results are stored separately
	for comparison in experiments.
	"""
	if not n_clicks or not model_name or not prompt:
	return no_update, no_update, no_update, no_update, no_update, no_update, no_update, no_update

	try:
	from transformers import AutoModelForCausalLM, AutoTokenizer
	model = AutoModelForCausalLM.from_pretrained(model_name, attn_implementation='eager')
	tokenizer = AutoTokenizer.from_pretrained(model_name)
	model.eval()

	# Always run beam search (even with max_new_tokens=1)
	results = perform_beam_search(model, tokenizer, prompt, beam_width, max_new_tokens)

	# Store original prompt for reference
	original_prompt_data = {'prompt': prompt, 'model': model_name}

	# Build module config for analysis
	module_patterns = patterns_data.get('module_patterns', {})
	param_patterns = patterns_data.get('param_patterns', {})

	config = {
	'attention_modules': [mod for pattern in (attn_patterns or []) for mod in module_patterns.get(pattern, [])],
	'block_modules': [mod for pattern in (block_patterns or []) for mod in module_patterns.get(pattern, [])],
	'norm_parameters': [param for pattern in (norm_patterns or []) for param in param_patterns.get(pattern, [])]
	}

	if not config['block_modules']:
	return (html.Div("Please select modules in the sidebar.", style={'color': 'red'}),
	results, {'display': 'none'}, {'display': 'none'}, {}, {}, original_prompt_data, {})

	# For single-token generation, analyze the full output (prompt + generated token)
	# so attention covers the entire sequence. For multi-token, start with prompt only;
	# the full-sequence analysis runs when the user selects a beam.
	if max_new_tokens == 1:
	full_text = results[0]['text']
	# Pass original_prompt so per-position top-5 is computed for the scrubber
	activation_data = execute_forward_pass(model, tokenizer, full_text, config,
	original_prompt=prompt)
	else:
	full_text = prompt
	activation_data = execute_forward_pass(model, tokenizer, full_text, config)

	results_ui = []
	if max_new_tokens > 1:
	# Show generated sequences for user selection
	results_ui.append(html.H4("Generated Sequences", className="section-title"))
	results_ui.append(html.P("Select a sequence to store for comparison after experiments.",
	style={'color': '#6c757d', 'fontSize': '13px', 'marginBottom': '12px'}))
	for i, result in enumerate(results):
	results_ui.append(html.Div([
	html.Div([
	html.Span(f"Rank {i+1}", style={'fontWeight': 'bold', 'marginRight': '10px', 'color': '#667eea'})
	], style={'marginBottom': '5px'}),
	html.Div(result['text'], style={'fontFamily': 'monospace', 'backgroundColor': '#fff', 'padding': '10px', 'borderRadius': '4px', 'border': '1px solid #dee2e6'}),
	html.Button("Select for Comparison", id={'type': 'result-item', 'index': i}, n_clicks=0,
	className="action-button secondary-button", style={'marginTop': '10px', 'fontSize': '12px'})
	], style={'marginBottom': '15px', 'padding': '15px', 'backgroundColor': '#f8f9fa', 'borderRadius': '6px'}))

	# Show pipeline immediately (analyzing original prompt)
	return (results_ui, results, {'display': 'block'}, {'display': 'block'},
	activation_data, activation_data, original_prompt_data, {})

	else:
	if beam_width > 1:
	# Multiple beams, single token — show selection UI
	results_ui.append(html.H4("Generated Sequences", className="section-title"))
	results_ui.append(html.P("Select a sequence to store for comparison after experiments.",
	style={'color': '#6c757d', 'fontSize': '13px', 'marginBottom': '12px'}))
	for i, result in enumerate(results):
	results_ui.append(html.Div([
	html.Div([
	html.Span(f"Rank {i+1}", style={'fontWeight': 'bold', 'marginRight': '10px', 'color': '#667eea'})
	], style={'marginBottom': '5px'}),
	html.Div(result['text'], style={'fontFamily': 'monospace', 'backgroundColor': '#fff', 'padding': '10px', 'borderRadius': '4px', 'border': '1px solid #dee2e6'}),
	html.Button("Select for Comparison", id={'type': 'result-item', 'index': i}, n_clicks=0,
	className="action-button secondary-button", style={'marginTop': '10px', 'fontSize': '12px'})
	], style={'marginBottom': '15px', 'padding': '15px', 'backgroundColor': '#f8f9fa', 'borderRadius': '6px'}))
	selected_beam_data = {}
	else:
	# Single beam, single token — auto-select and show "Selected" badge
	result = results[0]
	selected_beam_data = {'text': result['text'], 'score': result.get('score', 0)}
	results_ui.append(html.Div([
	html.H4("Selected Sequence", className="section-title"),
	html.Div([
	html.Div([
	html.Span([
	html.I(className="fas fa-check-circle", style={'marginRight': '8px', 'color': '#28a745'}),
	"Selected for Comparison"
	], style={
	'display': 'inline-flex', 'alignItems': 'center',
	'padding': '6px 12px', 'backgroundColor': '#d4edda',
	'color': '#155724', 'borderRadius': '16px',
	'fontSize': '12px', 'fontWeight': '500', 'marginBottom': '12px'
	})
	]),
	html.Div(result['text'], style={
	'fontFamily': 'monospace', 'backgroundColor': '#fff',
	'padding': '12px', 'borderRadius': '6px', 'border': '2px solid #28a745'
	})
	], style={
	'padding': '16px', 'backgroundColor': '#f8f9fa',
	'borderRadius': '8px', 'border': '1px solid #dee2e6'
	})
	]))

	return (results_ui, results, {'display': 'block'}, {'display': 'block'},
	activation_data, activation_data, original_prompt_data, selected_beam_data)

	except Exception as e:
	import traceback
	traceback.print_exc()
	return (html.Div(f"Error: {e}", style={'color': 'red'}), [],
	{'display': 'none'}, {'display': 'none'}, {}, {}, {}, {})


	@app.callback(
	[Output('session-selected-beam-store', 'data', allow_duplicate=True),
	Output('generation-results-container', 'children', allow_duplicate=True),
	Output('session-activation-store', 'data', allow_duplicate=True),
	Output('session-activation-store-original', 'data', allow_duplicate=True)],
	Input({'type': 'result-item', 'index': ALL}, 'n_clicks'),
	[State('generation-results-store', 'data'),
	State('session-activation-store', 'data'),
	State('session-original-prompt-store', 'data')],
	prevent_initial_call=True
	)
	def store_selected_beam(n_clicks_list, results_data, existing_activation_data, original_prompt_data):
	"""
	Store selected beam and re-run forward pass on the full sequence.

	When a beam is selected, this re-runs execute_forward_pass on the complete
	generated text (prompt + output) so the attention visualization covers
	the entire chosen output, not just the input.
	"""
	if not any(n_clicks_list) or not results_data:
	return no_update, no_update, no_update, no_update

	ctx = dash.callback_context
	if not ctx.triggered:
	return no_update, no_update, no_update, no_update

	triggered_id = json.loads(ctx.triggered[0]['prop_id'].split('.')[0])
	index = triggered_id['index']

	result = results_data[index]

	# Build UI showing only the selected sequence with a "selected" badge
	selected_ui = html.Div([
	html.H4("Selected Sequence", className="section-title"),
	html.Div([
	html.Div([
	html.Span([
	html.I(className="fas fa-check-circle", style={'marginRight': '8px', 'color': '#28a745'}),
	"Selected for Comparison"
	], style={
	'display': 'inline-flex',
	'alignItems': 'center',
	'padding': '6px 12px',
	'backgroundColor': '#d4edda',
	'color': '#155724',
	'borderRadius': '16px',
	'fontSize': '12px',
	'fontWeight': '500',
	'marginBottom': '12px'
	})
	]),
	html.Div(result['text'], style={
	'fontFamily': 'monospace',
	'backgroundColor': '#fff',
	'padding': '12px',
	'borderRadius': '6px',
	'border': '2px solid #28a745'
	})
	], style={
	'padding': '16px',
	'backgroundColor': '#f8f9fa',
	'borderRadius': '8px',
	'border': '1px solid #dee2e6'
	})
	])

	# Re-run forward pass on the full beam text so attention covers entire output
	new_activation_data = no_update
	if existing_activation_data:
	try:
	from transformers import AutoModelForCausalLM, AutoTokenizer
	model_name = existing_activation_data['model']
	config = {
	'attention_modules': existing_activation_data['attention_modules'],
	'block_modules': existing_activation_data['block_modules'],
	'norm_parameters': existing_activation_data.get('norm_parameters', [])
	}
	model = AutoModelForCausalLM.from_pretrained(model_name, attn_implementation='eager')
	tokenizer = AutoTokenizer.from_pretrained(model_name)
	model.eval()
	# Pass original_prompt so per-position top-5 data is computed for scrubber
	orig_prompt = original_prompt_data.get('prompt', '') if original_prompt_data else ''
	new_activation_data = execute_forward_pass(
	model, tokenizer, result['text'], config,
	original_prompt=orig_prompt
	)
	except Exception as e:
	import traceback
	traceback.print_exc()
	print(f"Warning: Could not re-run forward pass for full sequence: {e}")

	# Store the selected beam for comparison after experiments
	return ({'text': result['text'], 'score': result.get('score', 0), 'index': index},
	selected_ui, new_activation_data, new_activation_data)


	# ============================================================================
	# CALLBACKS: Pipeline Stage Content
	# ============================================================================

	@app.callback(
	[Output('stage-1-summary', 'children'),
	Output('stage-1-content', 'children'),
	Output('stage-2-summary', 'children'),
	Output('stage-2-content', 'children'),
	Output('stage-3-summary', 'children'),
	Output('stage-3-content', 'children'),
	Output('stage-4-summary', 'children'),
	Output('stage-4-content', 'children'),
	Output('stage-5-summary', 'children'),
	Output('stage-5-content', 'children')],
	[Input('session-activation-store', 'data')],
	[State('model-dropdown', 'value')]
	)
	def update_pipeline_content(activation_data, model_name):
	"""Update all pipeline stage content based on activation data."""
	empty_outputs = ["Awaiting analysis...", html.P("Run analysis to see details.", style={'color': '#6c757d'})] * 5

	if not activation_data or not model_name:
	return tuple(empty_outputs)

	# Safety check: ensure activation data matches the current model
	data_model = activation_data.get('model', '')
	if data_model and data_model != model_name and data_model != 'unknown':
	# Stale activation data from a different model — show empty
	return tuple(empty_outputs)

	try:
	from transformers import AutoModelForCausalLM, AutoTokenizer
	model = AutoModelForCausalLM.from_pretrained(model_name, attn_implementation='eager')
	tokenizer = AutoTokenizer.from_pretrained(model_name)

	# Use pre-decoded tokens if available, otherwise decode from input_ids
	input_ids = activation_data.get('input_ids', [[]])[0]
	tokens = activation_data.get('tokens') or [tokenizer.decode([tid]) for tid in input_ids]
	layer_data = extract_layer_data(activation_data, model, tokenizer)

	# Use stored model config if available, otherwise read from model
	model_cfg = activation_data.get('model_config', {})
	hidden_dim = model_cfg.get('hidden_size', model.config.hidden_size)
	num_heads = model_cfg.get('num_attention_heads', model.config.num_attention_heads)
	num_layers = model_cfg.get('num_hidden_layers', model.config.num_hidden_layers)
	intermediate_dim = model_cfg.get('intermediate_size', getattr(model.config, 'intermediate_size', hidden_dim * 4))

	# Get actual output
	actual_output = activation_data.get('actual_output', {})
	predicted_token = actual_output.get('token', '')
	predicted_prob = actual_output.get('probability', 0)

	# Get global top 5
	global_top5 = activation_data.get('global_top5_tokens', [])
	if global_top5:
	if isinstance(global_top5[0], dict):
	top_tokens = [(t['token'], t['probability']) for t in global_top5]
	else:
	top_tokens = global_top5
	else:
	top_tokens = []

	# Generate BertViz HTML
	from utils import generate_bertviz_html
	attention_html = None
	try:
	attention_html = generate_bertviz_html(activation_data, 0, 'full')
	except:
	pass

	# Get head categorization from pre-computed JSON + runtime verification
	head_categories = None
	try:
	from utils.head_detection import get_active_head_summary
	head_categories = get_active_head_summary(activation_data, model_name)
	except:
	pass

	# Build outputs for each stage
	outputs = []

	# Stage 1: Tokenization
	outputs.append(f"{len(tokens)} tokens")
	outputs.append(create_tokenization_content(tokens, input_ids))

	# Stage 2: Embedding
	outputs.append(f"{hidden_dim}-dim vectors")
	outputs.append(create_embedding_content(hidden_dim, len(tokens)))

	# Stage 3: Attention (Agent G: now includes head_categories)
	outputs.append(f"{num_heads} heads × {num_layers} layers")
	outputs.append(create_attention_content(attention_html, None, head_categories=head_categories))

	# Stage 4: MLP
	outputs.append(f"{num_layers} layers")
	outputs.append(create_mlp_content(num_layers, hidden_dim, intermediate_dim))

	# Stage 5: Output
	# Get original prompt for context display
	original_prompt = activation_data.get('prompt', '')
	# Per-position data for the scrubber (populated when original_prompt was given)
	per_position_data = activation_data.get('per_position_top5', [])
	generated_tokens = activation_data.get('generated_tokens', [])
	scrubber_prompt = activation_data.get('original_prompt', original_prompt)

	outputs.append(f"→ {predicted_token}")
	outputs.append(create_output_content(
	top_tokens, predicted_token, predicted_prob,
	original_prompt=original_prompt,
	per_position_data=per_position_data,
	generated_tokens=generated_tokens,
	prompt_text=scrubber_prompt
	))

	return tuple(outputs)

	except Exception as e:
	import traceback
	traceback.print_exc()
	return tuple(empty_outputs)


	# ============================================================================
	# CALLBACKS: Output Scrubber
	# ============================================================================

	@app.callback(
	[Output('output-token-display', 'children'),
	Output('output-top5-chart', 'children')],
	[Input('output-scrubber-slider', 'value')],
	[State('session-activation-store', 'data')],
	prevent_initial_call=True
	)
	def update_output_scrubber(position, activation_data):
	"""Update the token display and top-5 chart when the scrubber slider moves."""
	if activation_data is None or position is None:
	return no_update, no_update

	per_position_data = activation_data.get('per_position_top5', [])
	generated_tokens = activation_data.get('generated_tokens', [])
	prompt_text = activation_data.get('original_prompt', activation_data.get('prompt', ''))

	if not per_position_data or not generated_tokens:
	return no_update, no_update

	# Clamp position to valid range
	position = max(0, min(position, len(per_position_data) - 1))
	pos_data = per_position_data[position]

	token_display = _build_token_display(
	prompt_text, generated_tokens, position, pos_data['actual_prob']
	)
	top5_chart = _build_top5_chart(pos_data['top5'], pos_data.get('actual_token'))

	return token_display, top5_chart


	# ============================================================================
	# CALLBACKS: Sidebar
	# ============================================================================

	@app.callback(
	[Output('sidebar-collapse-store', 'data'),
	Output('sidebar-content', 'style'),
	Output('sidebar-container', 'className'),
	Output('sidebar-toggle-btn', 'children')],
	[Input('sidebar-toggle-btn', 'n_clicks')],
	[State('sidebar-collapse-store', 'data')],
	prevent_initial_call=False
	)
	def toggle_sidebar(n_clicks, is_collapsed):
	if n_clicks is None:
	return True, {'display': 'none'}, 'sidebar collapsed', html.I(className="fas fa-chevron-right")

	new_collapsed = not is_collapsed
	style = {'display': 'none'} if new_collapsed else {'display': 'block'}
	class_name = 'sidebar collapsed' if new_collapsed else 'sidebar'
	icon = html.I(className="fas fa-chevron-right") if new_collapsed else html.I(className="fas fa-chevron-left")

	return new_collapsed, style, class_name, icon


	# ============================================================================
	# CALLBACKS: Investigation Panel - Tabs
	# ============================================================================

	@app.callback(
	[Output('investigation-active-tab', 'data'),
	Output('investigation-tab-ablation', 'style'),
	Output('investigation-tab-attribution', 'style'),
	Output('investigation-ablation-content', 'style'),
	Output('investigation-attribution-content', 'style')],
	[Input('investigation-tab-ablation', 'n_clicks'),
	Input('investigation-tab-attribution', 'n_clicks')],
	[State('investigation-active-tab', 'data')],
	prevent_initial_call=True
	)
	def switch_investigation_tab(abl_clicks, attr_clicks, current_tab):
	ctx = dash.callback_context
	if not ctx.triggered:
	return no_update, no_update, no_update, no_update, no_update

	triggered_id = ctx.triggered[0]['prop_id'].split('.')[0]

	active_style = {'padding': '10px 20px', 'border': 'none', 'borderRadius': '6px', 'cursor': 'pointer',
	'fontSize': '14px', 'fontWeight': '500', 'backgroundColor': '#667eea', 'color': 'white'}
	inactive_style = {'padding': '10px 20px', 'border': 'none', 'borderRadius': '6px', 'cursor': 'pointer',
	'fontSize': '14px', 'fontWeight': '500', 'backgroundColor': '#f8f9fa', 'color': '#495057'}

	if triggered_id == 'investigation-tab-ablation':
	return 'ablation', active_style, inactive_style, {'display': 'block'}, {'display': 'none'}
	else:
	return 'attribution', inactive_style, active_style, {'display': 'none'}, {'display': 'block'}


	# ============================================================================
	# CALLBACKS: Investigation Panel - Ablation (Updated for New UI)
	# ============================================================================

	@app.callback(
	[Output('ablation-layer-select', 'options'),
	Output('ablation-head-select', 'options')],
	[Input('session-activation-store', 'data'),
	Input('ablation-layer-select', 'value')],
	[State('model-dropdown', 'value')]
	)
	def update_ablation_selectors(activation_data, selected_layer, model_name):
	"""Update options for layer and head dropdowns."""
	ctx = dash.callback_context
	trigger_id = ctx.triggered[0]['prop_id'].split('.')[0] if ctx.triggered else None

	if not activation_data or not model_name:
	return [], []

	# Get model config
	try:
	from transformers import AutoConfig
	config = AutoConfig.from_pretrained(model_name)
	num_layers = config.num_hidden_layers
	num_heads = config.num_attention_heads
	except:
	return [], []

	# Update layer options (only if data changed or init)
	layer_options = [{'label': f'Layer {i}', 'value': i} for i in range(num_layers)]

	# Update head options based on selected layer
	head_options = []
	if selected_layer is not None:
	head_options = [{'label': f'Head {i}', 'value': i} for i in range(num_heads)]

	# If only layer changed, return no_update for layer options to avoid flickering
	if trigger_id == 'ablation-layer-select':
	return no_update, head_options

	return layer_options, head_options


	@app.callback(
	[Output('ablation-selected-heads', 'data'),
	Output('run-ablation-btn', 'disabled'),
	Output('ablation-selected-display', 'children'),
	Output('ablation-head-select', 'value')],
	[Input('ablation-add-head-btn', 'n_clicks'),
	Input('clear-ablation-btn', 'n_clicks'),
	Input({'type': 'ablation-remove-btn', 'layer': ALL, 'head': ALL}, 'n_clicks')],
	[State('ablation-layer-select', 'value'),
	State('ablation-head-select', 'value'),
	State('ablation-selected-heads', 'data')],
	prevent_initial_call=True
	)
	def manage_ablation_heads(add_clicks, clear_clicks, remove_clicks,
	layer_val, head_val, selected_heads):
	"""
	Manage the list of selected heads (Add, Clear, Remove).
	"""
	ctx = dash.callback_context
	if not ctx.triggered:
	return no_update, no_update, no_update, no_update

	triggered_id = ctx.triggered[0]['prop_id']

	# Initialize selected_heads
	if selected_heads is None:
	selected_heads = []

	# Handle "Add"
	if 'ablation-add-head-btn' in triggered_id:
	if layer_val is not None and head_val is not None:
	# Check for duplicate
	exists = any(item['layer'] == layer_val and item['head'] == head_val
	for item in selected_heads if isinstance(item, dict))
	if not exists:
	selected_heads.append({'layer': layer_val, 'head': head_val})
	# Sort for cleaner display
	selected_heads.sort(key=lambda x: (x['layer'], x['head']))
	# Clear head selection after add
	return selected_heads, len(selected_heads) == 0, create_selected_heads_display(selected_heads), None

	# Handle "Clear"
	elif 'clear-ablation-btn' in triggered_id:
	return [], True, create_selected_heads_display([]), no_update

	# Handle "Remove" (pattern matching)
	elif 'ablation-remove-btn' in triggered_id:
	# Determine which button was clicked
	# Note: remove_clicks is a list, but we need the id from context
	prop_id = json.loads(triggered_id.split('.')[0])
	rm_layer = prop_id['layer']
	rm_head = prop_id['head']

	selected_heads = [
	item for item in selected_heads
	if not (isinstance(item, dict) and item.get('layer') == rm_layer and item.get('head') == rm_head)
	]
	return selected_heads, len(selected_heads) == 0, create_selected_heads_display(selected_heads), no_update

	return no_update, no_update, no_update, no_update


	@app.callback(
	[Output('ablation-results-container', 'children'),
	Output('session-activation-store', 'data', allow_duplicate=True),
	Output('session-activation-store-original', 'data', allow_duplicate=True)],
	[Input('run-ablation-btn', 'n_clicks')],
	[State('ablation-selected-heads', 'data'),
	State('session-activation-store', 'data'),
	State('model-dropdown', 'value'),
	State('prompt-input', 'value'),
	State('session-selected-beam-store', 'data'),
	State('max-new-tokens-slider', 'value'),
	State('beam-width-slider', 'value')],
	prevent_initial_call=True
	)
	def run_ablation_experiment(n_clicks, selected_heads, activation_data, model_name, prompt, selected_beam, max_new_tokens, beam_width):
	"""Run ablation on ORIGINAL PROMPT and compare results, including beam generation."""
	if not n_clicks or not selected_heads or not activation_data:
	return no_update, no_update, no_update

	try:
	from transformers import AutoModelForCausalLM, AutoTokenizer
	model = AutoModelForCausalLM.from_pretrained(model_name, attn_implementation='eager')
	tokenizer = AutoTokenizer.from_pretrained(model_name)
	model.eval()

	sequence_text = prompt

	config = {
	'attention_modules': activation_data.get('attention_modules', []),
	'block_modules': activation_data.get('block_modules', []),
	'norm_parameters': activation_data.get('norm_parameters', [])
	}

	# Original output
	original_output = activation_data.get('actual_output', {})
	original_token = original_output.get('token', '')
	original_prob = original_output.get('probability', 0)

	# Group heads by layer
	heads_by_layer = {}
	for item in selected_heads:
	if isinstance(item, dict):
	layer = item.get('layer')
	head = item.get('head')
	if layer is not None and head is not None:
	if layer not in heads_by_layer:
	heads_by_layer[layer] = []
	heads_by_layer[layer].append(head)

	if not heads_by_layer:
	return html.Div("No valid heads selected.", style={'color': '#dc3545'}), no_update, no_update

	# Run ablation for generation
	ablated_beam = None
	analysis_text = sequence_text
	try:
	# Always perform beam search during ablation to show comparison
	beam_results = perform_beam_search(
	model, tokenizer, sequence_text,
	beam_width=beam_width,
	max_new_tokens=max_new_tokens,
	ablation_config=heads_by_layer
	)
	if beam_results:
	# Select the top beam
	ablated_beam = {'text': beam_results[0]['text'], 'score': beam_results[0].get('score', 0)}
	analysis_text = ablated_beam['text']
	except Exception as e:
	print(f"Error during ablated generation: {e}")

	# Run ablation for analysis (single pass) on the final generated text
	ablated_data = execute_forward_pass_with_multi_layer_head_ablation(
	model, tokenizer, analysis_text, config, heads_by_layer, original_prompt=prompt
	)

	# Mark as ablated so UI knows
	ablated_data['ablated'] = True

	# Ensure original data has generation info for the comparison display.
	# When no beam was selected (multi-token without "Select for Comparison"),
	# activation_data lacks generated_tokens/per_position_top5.
	original_data_for_display = activation_data
	if not activation_data.get('generated_tokens'):
	original_beam_results = perform_beam_search(
	model, tokenizer, prompt, beam_width, max_new_tokens
	)
	if original_beam_results:
	original_text = original_beam_results[0]['text']
	original_data_for_display = execute_forward_pass(
	model, tokenizer, original_text, config, original_prompt=prompt
	)
	# Auto-populate selected_beam for text display
	if not selected_beam:
	selected_beam = {
	'text': original_text,
	'score': original_beam_results[0].get('score', 0)
	}

	ablated_output = ablated_data.get('actual_output', {})
	ablated_token = ablated_output.get('token', '')
	ablated_prob = ablated_output.get('probability', 0)

	results_display = create_ablation_results_display(
	original_data_for_display, ablated_data,
	selected_heads, selected_beam, ablated_beam
	)

	return results_display, ablated_data, original_data_for_display

	except Exception as e:
	import traceback
	traceback.print_exc()
	return html.Div(f"Ablation error: {str(e)}", style={'color': '#dc3545'}), no_update, no_update


	@app.callback(
	[Output('ablation-original-token-map', 'children'),
	Output('ablation-original-text-box', 'children'),
	Output('ablation-original-top5-chart', 'figure'),
	Output('ablation-ablated-token-map', 'children'),
	Output('ablation-ablated-text-box', 'children'),
	Output('ablation-ablated-top5-chart', 'figure'),
	Output('ablation-divergence-indicator', 'children')],
	[Input('ablation-scrubber-slider', 'value')],
	[State('session-activation-store-original', 'data'),
	State('session-activation-store', 'data')],
	prevent_initial_call=True
	)
	def update_ablation_scrubber(position, original_data, ablated_data):
	if position is None or not original_data or not ablated_data:
	import dash
	return dash.no_update

	from components.ablation_panel import build_token_map, build_text_box, build_chart, build_divergence_indicator

	orig_pos_data = original_data.get('per_position_top5', [])
	abl_pos_data = ablated_data.get('per_position_top5', [])

	orig_tokens = original_data.get('generated_tokens', [])
	abl_tokens = ablated_data.get('generated_tokens', [])

	# Find changed indices
	changed_indices = set()
	for i in range(max(len(orig_tokens), len(abl_tokens))):
	if i >= len(orig_tokens) or i >= len(abl_tokens) or orig_tokens[i] != abl_tokens[i]:
	changed_indices.add(i)

	prompt_text = original_data.get('original_prompt', original_data.get('prompt', ''))

	orig_map = build_token_map(orig_tokens, position, set()) # original doesn't show red 'changed' state
	abl_map = build_token_map(abl_tokens, position, changed_indices)

	orig_text_box = build_text_box(prompt_text, orig_tokens, position, set())
	abl_text_box = build_text_box(prompt_text, abl_tokens, position, changed_indices)

	orig_chart = []
	abl_chart = []

	if position < len(orig_pos_data):
	orig_chart = build_chart(orig_pos_data[position], orig_pos_data[position].get('actual_token'), '#4c51bf')
	if position < len(abl_pos_data):
	abl_chart = build_chart(abl_pos_data[position], abl_pos_data[position].get('actual_token'), '#e53e3e')

	is_diverged = position in changed_indices
	divergence_indicator = build_divergence_indicator(is_diverged)

	return orig_map, orig_text_box, orig_chart, abl_map, abl_text_box, abl_chart, divergence_indicator


	# ============================================================================
	# CALLBACKS: Investigation Panel - Attribution
	# ============================================================================

	@app.callback(
	Output('attribution-target-dropdown', 'options'),
	[Input('session-activation-store', 'data')]
	)
	def update_attribution_target_options(activation_data):
	if not activation_data:
	return []

	global_top5 = activation_data.get('global_top5_tokens', [])
	options = []
	for t in global_top5:
	if isinstance(t, dict):
	options.append({'label': f"{t['token']} ({t['probability']:.1%})", 'value': t['token']})
	else:
	options.append({'label': t[0], 'value': t[0]})
	return options


	@app.callback(
	Output('attribution-results-container', 'children'),
	[Input('run-attribution-btn', 'n_clicks')],
	[State('attribution-method-radio', 'value'),
	State('attribution-target-dropdown', 'value'),
	State('session-activation-store', 'data'),
	State('model-dropdown', 'value'),
	State('prompt-input', 'value')],
	prevent_initial_call=True
	)
	def run_attribution_experiment(n_clicks, method, target_token, activation_data, model_name, prompt):
	if not n_clicks or not activation_data:
	return no_update

	try:
	from transformers import AutoModelForCausalLM, AutoTokenizer
	model = AutoModelForCausalLM.from_pretrained(model_name, attn_implementation='eager')
	tokenizer = AutoTokenizer.from_pretrained(model_name)
	model.eval()

	sequence_text = activation_data.get('prompt', prompt)

	# Get target token ID if specified
	target_token_id = None
	if target_token:
	target_ids = tokenizer.encode(target_token, add_special_tokens=False)
	if target_ids:
	target_token_id = target_ids[-1]

	# Run attribution
	if method == 'integrated':
	attribution_result = compute_integrated_gradients(
	model, tokenizer, sequence_text, target_token_id, n_steps=30
	)
	else:
	attribution_result = compute_simple_gradient_attribution(
	model, tokenizer, sequence_text, target_token_id
	)

	return create_attribution_results_display(
	attribution_result, attribution_result['target_token']
	)

	except Exception as e:
	import traceback
	traceback.print_exc()
	return html.Div(f"Attribution error: {str(e)}", style={'color': '#dc3545'})


	# ============================================================================
	# CALLBACKS: Reset Ablation
	# ============================================================================

	@app.callback(
	Output('reset-ablation-container', 'style'),
	Input('session-activation-store', 'data'),
	prevent_initial_call=False
	)
	def toggle_reset_ablation_button(activation_data):
	if activation_data and activation_data.get('ablated', False):
	return {'display': 'block'}
	return {'display': 'none'}


	@app.callback(
	[Output('session-activation-store', 'data', allow_duplicate=True),
	Output('session-activation-store-original', 'data'),
	Output('model-status', 'children', allow_duplicate=True)],
	Input('reset-ablation-btn', 'n_clicks'),
	[State('session-activation-store-original', 'data')],
	prevent_initial_call=True
	)
	def reset_ablation(n_clicks, original_data):
	if not n_clicks or not original_data:
	return no_update, no_update, no_update

	success_message = html.Div([
	html.I(className="fas fa-undo", style={'marginRight': '8px', 'color': '#28a745'}),
	"Ablation reset"
	], className="status-success")

	return original_data, {}, success_message


	# ============================================================================
	# CALLBACKS: AI Chatbot
	# ============================================================================
	import threading
	import queue

	_chat_stream_queue = queue.Queue()
	_chat_stream_active = False
	_chat_stream_content = ""

	def _background_generate(user_input, chat_history, dashboard_context):
	global _chat_stream_active
	try:
	from utils.rag_utils import build_rag_context
	rag_context = build_rag_context(user_input, top_k=3)
	from utils.openrouter_client import generate_stream
	for chunk in generate_stream(user_input, chat_history, rag_context, dashboard_context):
	_chat_stream_queue.put(chunk)
	except Exception as e:
	_chat_stream_queue.put(f"\n[Error: {str(e)}]")
	finally:
	_chat_stream_active = False


	@app.callback(
	[Output('chat-window', 'style'),
	Output('chat-open-store', 'data'),
	Output('chat-toggle-btn', 'style')],
	[Input('chat-toggle-btn', 'n_clicks'),
	Input('chat-close-btn', 'n_clicks')],
	[State('chat-open-store', 'data')],
	prevent_initial_call=True
	)
	def toggle_chat_window(toggle_clicks, close_clicks, is_open):
	"""Toggle the chat window open/closed."""
	ctx = dash.callback_context
	if not ctx.triggered:
	return no_update, no_update, no_update

	trigger_id = ctx.triggered[0]['prop_id'].split('.')[0]

	# Default toggle button style (visible)
	toggle_visible = {}
	# Hidden toggle button style
	toggle_hidden = {'display': 'none'}

	if trigger_id == 'chat-close-btn':
	return {'display': 'none'}, False, toggle_visible

	# Toggle button clicked
	new_state = not is_open
	if new_state:
	# Open chat, hide toggle button
	return {'display': 'flex'}, True, toggle_hidden
	else:
	# Close chat, show toggle button
	return {'display': 'none'}, False, toggle_visible


	@app.callback(
	Output('chat-history-store', 'data', allow_duplicate=True),
	Input('chat-clear-btn', 'n_clicks'),
	prevent_initial_call=True
	)
	def clear_chat_history(n_clicks):
	"""Clear all chat history."""
	if not n_clicks:
	return no_update
	return []


	@app.callback(
	[Output('chat-messages-list', 'children'),
	Output('chat-history-store', 'data', allow_duplicate=True),
	Output('chat-input', 'value'),
	Output('chat-typing-indicator', 'style'),
	Output('chat-response-interval', 'disabled')],
	[Input('chat-send-btn', 'n_clicks')],
	[State('chat-input', 'value'),
	State('chat-history-store', 'data'),
	State('model-dropdown', 'value'),
	State('prompt-input', 'value'),
	State('session-activation-store', 'data'),
	State('ablation-selected-heads', 'data')],
	prevent_initial_call=True
	)
	def send_chat_message(send_clicks, user_input, chat_history,
	model_name, prompt, activation_data, ablated_heads):
	"""Handle sending a chat message and start stream."""
	global _chat_stream_active, _chat_stream_content

	if not user_input or not user_input.strip():
	return no_update, no_update, no_update, no_update, no_update

	user_input = user_input.strip()

	if chat_history is None:
	chat_history = []

	chat_history.append({'role': 'user', 'content': user_input})
	chat_history.append({'role': 'assistant', 'content': ''})

	dashboard_context = {}
	if model_name: dashboard_context['model'] = model_name
	if prompt: dashboard_context['prompt'] = prompt
	if activation_data:
	actual_output = activation_data.get('actual_output', {})
	if actual_output:
	dashboard_context['predicted_token'] = actual_output.get('token', '')
	dashboard_context['predicted_probability'] = actual_output.get('probability', 0)
	top5 = activation_data.get('global_top5_tokens', [])
	if top5: dashboard_context['top_predictions'] = top5
	if ablated_heads: dashboard_context['ablated_heads'] = ablated_heads

	_chat_stream_content = ""
	while not _chat_stream_queue.empty():
	try: _chat_stream_queue.get_nowait()
	except: pass

	_chat_stream_active = True
	threading.Thread(
	target=_background_generate,
	args=(user_input, chat_history[:-2], dashboard_context),
	daemon=True
	).start()

	messages_ui = render_messages(chat_history[:-1])

	return messages_ui, chat_history, '', {'display': 'flex'}, False


	@app.callback(
	[Output('chat-messages-list', 'children', allow_duplicate=True),
	Output('chat-history-store', 'data', allow_duplicate=True),
	Output('chat-response-interval', 'disabled', allow_duplicate=True),
	Output('chat-typing-indicator', 'style', allow_duplicate=True)],
	[Input('chat-response-interval', 'n_intervals')],
	[State('chat-history-store', 'data')],
	prevent_initial_call=True
	)
	def update_stream(n_intervals, chat_history):
	global _chat_stream_active, _chat_stream_content

	if not chat_history:
	return no_update, no_update, True, no_update

	chunks = []
	while not _chat_stream_queue.empty():
	try:
	chunks.append(_chat_stream_queue.get_nowait())
	except queue.Empty:
	break

	if chunks:
	_chat_stream_content += "".join(chunks)
	if chat_history[-1]['role'] == 'assistant':
	chat_history[-1]['content'] = _chat_stream_content

	messages_ui = render_messages(chat_history)
	return messages_ui, chat_history, False, {'display': 'none'}

	elif not _chat_stream_active:
	return no_update, no_update, True, {'display': 'none'}

	return no_update, no_update, False, {'display': 'flex'}


	@app.callback(
	[Output('chat-messages-list', 'children', allow_duplicate=True),
	Output('chat-history-store', 'data', allow_duplicate=True)],
	Input('chat-history-store', 'data'),
	prevent_initial_call='initial_duplicate' # Allows initial call with allow_duplicate
	)
	def update_messages_from_store(chat_history):
	"""Update message display when history changes (e.g., on page load from localStorage)."""
	from components.chatbot import GREETING_MESSAGE

	# If history is empty (localStorage empty/cleared), inject the greeting
	if not chat_history:
	greeting_history = [{'role': 'assistant', 'content': GREETING_MESSAGE}]
	return render_messages(greeting_history), greeting_history

	# Filter out empty assistant placeholders (used during streaming)
	display_history = [m for m in chat_history if m.get('content')]
	return render_messages(display_history), no_update


	# Client-side callback for scroll down
	app.clientside_callback(
	"""
	function(children) {
	setTimeout(() => {
	const container = document.getElementById('chat-messages-container');
	if (container) {
	container.scrollTop = container.scrollHeight;
	}
	}, 50);
	return window.dash_clientside.no_update;
	}
	""",
	Output('chat-messages-container', 'className'),
	Input('chat-messages-list', 'children'),
	prevent_initial_call=True
	)

	# Client-side callback for copy functionality
	app.clientside_callback(
	"""
	function(n_clicks) {
	if (!n_clicks) return window.dash_clientside.no_update;

	// Find the clicked button and get its data-content attribute
	const triggered = window.dash_clientside.callback_context.triggered;
	if (!triggered \|\| triggered.length === 0) return window.dash_clientside.no_update;

	const propId = triggered[0].prop_id;
	const match = propId.match(/{"index":(\d+),"type":"copy-message-btn"}/);
	if (!match) return window.dash_clientside.no_update;

	const btn = document.querySelector(`[id='{"index":${match[1]},"type":"copy-message-btn"}']`);
	if (!btn) return window.dash_clientside.no_update;

	const content = btn.getAttribute('data-content');
	if (content) {
	navigator.clipboard.writeText(content).then(() => {
	btn.classList.add('copied');
	setTimeout(() => btn.classList.remove('copied'), 2000);
	});
	}

	return window.dash_clientside.no_update;
	}
	""",
	Output('chat-messages-list', 'className'),
	Input({'type': 'copy-message-btn', 'index': ALL}, 'n_clicks'),
	prevent_initial_call=True
	)


	# Client-side callback for Enter key to send message
	app.clientside_callback(
	"""
	function(id) {
	// Set up the event listener only once
	const textarea = document.getElementById('chat-input');
	const sendBtn = document.getElementById('chat-send-btn');

	if (textarea && sendBtn && !textarea._enterListenerAdded) {
	textarea.addEventListener('keydown', function(e) {
	if (e.key === 'Enter' && !e.shiftKey) {
	e.preventDefault();
	sendBtn.click();
	}
	});
	textarea._enterListenerAdded = true;
	}

	return window.dash_clientside.no_update;
	}
	""",
	Output('chat-input', 'className'),
	Input('chat-open-store', 'data'),
	prevent_initial_call=True
	)


	if __name__ == '__main__':
	# Use 0.0.0.0:7860 for Hugging Face Spaces, fallback to localhost:8050 for local dev
	import os
	port = int(os.environ.get("PORT", 7860))
	debug = os.environ.get("DEBUG", "false").lower() == "true"
	app.run(host='0.0.0.0', port=port, debug=debug)