# context_manager.py
import sqlite3
import json
import logging
import hashlib
import threading
import time
import os
from contextlib import contextmanager
from datetime import datetime
from typing import Dict, Optional, List

logger = logging.getLogger(__name__)


class TransactionManager:
    """Manage database transactions with proper locking"""

    def __init__(self, db_path):
        self.db_path = db_path
        self._lock = threading.RLock()
        self._connections = {}

    @contextmanager
    def transaction(self, session_id=None):
        """Context manager for database transactions with automatic rollback"""
        conn = None
        cursor = None
        try:
            with self._lock:
                conn = sqlite3.connect(self.db_path, isolation_level='IMMEDIATE')
                conn.execute('PRAGMA journal_mode=WAL')   # Write-Ahead Logging for better concurrency
                conn.execute('PRAGMA busy_timeout=5000')  # 5 second timeout for locks
                cursor = conn.cursor()
                yield cursor
                conn.commit()
                logger.debug(f"Transaction committed for session {session_id}")
        except Exception as e:
            if conn:
                conn.rollback()
            logger.error(f"Transaction rolled back for session {session_id}: {e}")
            raise
        finally:
            if conn:
                conn.close()


class EfficientContextManager:
    def __init__(self, llm_router=None, db_path=None):
        self.session_cache = {}   # In-memory cache for active sessions
        self._session_cache = {}  # Enhanced in-memory cache with timestamps
        self.cache_config = {
            "max_session_size": 10,  # MB per session
            "ttl": 3600,             # 1 hour
            "compression": "gzip",
            "eviction_policy": "LRU"
        }

        # Use the provided db_path or get it from config/env; default to /tmp for Docker
        if db_path is None:
            try:
                from config import settings
                db_path = settings.db_path
            except (ImportError, AttributeError):
                # Fallback: check the environment variable or use /tmp
                db_path = os.getenv("DB_PATH", "/tmp/sessions.db")
        self.db_path = db_path

        # Ensure the database directory exists
        db_dir = os.path.dirname(self.db_path)
        if db_dir and not os.path.exists(db_dir):
            os.makedirs(db_dir, exist_ok=True)
            logger.info(f"Created database directory: {db_dir}")

        self.llm_router = llm_router  # For generating context summaries

        logger.info(f"Initializing ContextManager with DB path: {self.db_path}")
        self.transaction_manager = TransactionManager(self.db_path)
        self._init_database()
        self.optimize_database_indexes()
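    # ------------------------------------------------------------------
    # Schema overview (descriptive note for orientation; the token sizes
    # are the targets used by the summary-generation prompts further down):
    #
    #   sessions             one row per session (raw context/metadata blobs)
    #   interactions         per-turn raw input + context snapshot, deduped
    #                        via interaction_hash
    #   user_contexts        one ~500-token persona summary per user
    #   session_contexts     one ~100-token rolling summary per session
    #   interaction_contexts one ~50-token summary per turn
    # ------------------------------------------------------------------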
    def _init_database(self):
        """Initialize database and create tables"""
        try:
            logger.info("Initializing database...")
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Create sessions table if it does not exist
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS sessions (
                    session_id TEXT PRIMARY KEY,
                    user_id TEXT DEFAULT 'Test_Any',
                    created_at TIMESTAMP,
                    last_activity TIMESTAMP,
                    context_data TEXT,
                    user_metadata TEXT
                )
            """)

            # Add user_id column to sessions tables created by older versions
            try:
                cursor.execute("ALTER TABLE sessions ADD COLUMN user_id TEXT DEFAULT 'Test_Any'")
                logger.info("✓ Added user_id column to sessions table")
            except sqlite3.OperationalError:
                # Column already exists
                pass
            logger.info("✓ Sessions table ready")

            # Create interactions table
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS interactions (
                    id INTEGER PRIMARY KEY AUTOINCREMENT,
                    session_id TEXT,
                    user_input TEXT,
                    context_snapshot TEXT,
                    created_at TIMESTAMP,
                    FOREIGN KEY(session_id) REFERENCES sessions(session_id)
                )
            """)
            logger.info("✓ Interactions table ready")

            # Create user_contexts table (persistent user persona summaries)
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS user_contexts (
                    user_id TEXT PRIMARY KEY,
                    persona_summary TEXT,
                    updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
                )
            """)
            logger.info("✓ User contexts table ready")

            # Create session_contexts table (session summaries)
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS session_contexts (
                    session_id TEXT PRIMARY KEY,
                    user_id TEXT,
                    session_summary TEXT,
                    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                    FOREIGN KEY(session_id) REFERENCES sessions(session_id),
                    FOREIGN KEY(user_id) REFERENCES user_contexts(user_id)
                )
            """)
            logger.info("✓ Session contexts table ready")

            # Create interaction_contexts table (individual interaction summaries)
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS interaction_contexts (
                    interaction_id TEXT PRIMARY KEY,
                    session_id TEXT,
                    user_input TEXT,
                    system_response TEXT,
                    interaction_summary TEXT,
                    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                    FOREIGN KEY(session_id) REFERENCES sessions(session_id)
                )
            """)
            logger.info("✓ Interaction contexts table ready")

            conn.commit()
            conn.close()

            # Update the schema with new columns and tables for user change tracking
            self._update_database_schema()
            logger.info("Database initialization complete")
        except Exception as e:
            logger.error(f"Database initialization error: {e}", exc_info=True)

    def _update_database_schema(self):
        """Add missing columns and tables for user change tracking"""
        try:
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Add needs_refresh column to interaction_contexts
            try:
                cursor.execute("""
                    ALTER TABLE interaction_contexts
                    ADD COLUMN needs_refresh INTEGER DEFAULT 0
                """)
                logger.info("✓ Added needs_refresh column to interaction_contexts")
            except sqlite3.OperationalError:
                pass  # Column already exists

            # Create user change log table
            cursor.execute("""
                CREATE TABLE IF NOT EXISTS user_change_log (
                    id INTEGER PRIMARY KEY AUTOINCREMENT,
                    session_id TEXT,
                    old_user_id TEXT,
                    new_user_id TEXT,
                    timestamp TIMESTAMP,
                    FOREIGN KEY(session_id) REFERENCES sessions(session_id)
                )
            """)

            conn.commit()
            conn.close()
            logger.info("✓ Database schema updated successfully for user change tracking")

            # Update interactions table for deduplication
            self._update_interactions_table()
        except Exception as e:
            logger.error(f"Schema update error: {e}", exc_info=True)

    def _update_interactions_table(self):
        """Add interaction_hash column for deduplication"""
        try:
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Check whether the column already exists
            cursor.execute("PRAGMA table_info(interactions)")
            columns = [row[1] for row in cursor.fetchall()]

            # Add interaction_hash column if it doesn't exist
            if 'interaction_hash' not in columns:
                try:
                    cursor.execute("""
                        ALTER TABLE interactions
                        ADD COLUMN interaction_hash TEXT
                    """)
                    logger.info("✓ Added interaction_hash column to interactions table")
                except sqlite3.OperationalError:
                    pass  # Column already exists

            # Create a unique index for deduplication (this enforces uniqueness)
            try:
                cursor.execute("""
                    CREATE UNIQUE INDEX IF NOT EXISTS idx_interaction_hash_unique
                    ON interactions(interaction_hash)
                """)
                logger.info("✓ Created unique index on interaction_hash")
            except sqlite3.OperationalError:
                # Index might already exist; fall back to a non-unique index
                cursor.execute("""
                    CREATE INDEX IF NOT EXISTS idx_interaction_hash
                    ON interactions(interaction_hash)
                """)

            conn.commit()
            conn.close()
            logger.info("✓ Interactions table updated for deduplication")
        except Exception as e:
            logger.error(f"Error updating interactions table: {e}", exc_info=True)
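    # Illustrative per-turn call pattern (hypothetical ids and caller; the
    # surrounding application code is not part of this module):
    #
    #     ctx = await manager.manage_context("sess-1", "hello", user_id="alice")
    #     prompt_context = ctx["combined_context"]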
    async def manage_context(self, session_id: str, user_input: str,
                             user_id: str = "Test_Any") -> dict:
        """
        Efficient context management with separated session/user caching

        STEP 1: Fetch User Context (if available)
        STEP 2: Get Previous Interaction Contexts
        STEP 3: Combine for workflow use
        """
        # Use a session-only cache key to prevent user_id conflicts
        session_cache_key = f"session_{session_id}"
        user_cache_key = f"user_{user_id}"

        # Get session context from the cache
        session_context = self._get_from_memory_cache(session_cache_key)

        # Check whether the cached session context matches the current user_id;
        # handle both old and new cache formats
        cached_entry = self.session_cache.get(session_cache_key)
        if cached_entry:
            # Extract the actual context from the cache entry
            if isinstance(cached_entry, dict) and 'value' in cached_entry:
                actual_context = cached_entry.get('value', {})
            else:
                actual_context = cached_entry

            if actual_context and actual_context.get("user_id") != user_id:
                # User changed, invalidate the session cache
                logger.info(f"User mismatch in cache for session {session_id}, invalidating cache")
                session_context = None
                if session_cache_key in self.session_cache:
                    del self.session_cache[session_cache_key]
            else:
                session_context = actual_context

        # Get user context separately
        user_context = self._get_from_memory_cache(user_cache_key)

        if not session_context:
            # Retrieve from the database with user context
            session_context = await self._retrieve_from_db(session_id, user_input, user_id)
            # Step 2: cache the session context with TTL
            self.add_context_cache(session_cache_key, session_context,
                                   ttl=self.cache_config.get("ttl", 3600))

        # Handle user context separately - load only once and cache thereafter
        # (the cache does not go back to the database after the initial load)
        if not user_context or not user_context.get("user_context_loaded"):
            user_context_data = await self.get_user_context(user_id)
            user_context = {
                "user_context": user_context_data,
                "user_context_loaded": True,
                "user_id": user_id
            }
            # Cache user context separately - this is the only database query for user context
            self._warm_memory_cache(user_cache_key, user_context)
            logger.debug(f"User context loaded once for {user_id} and cached")
        else:
            # User context already cached, use it without a database query
            logger.debug(f"Using cached user context for {user_id}")

        # Merge contexts without duplication
        merged_context = {
            **session_context,
            "user_context": user_context.get("user_context", ""),
            "user_context_loaded": True,
            "user_id": user_id  # Ensure the current user_id is used
        }

        # Update context with the new interaction
        updated_context = self._update_context(merged_context, user_input, user_id=user_id)

        return self._optimize_context(updated_context)
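    # Shape of the dict returned by manage_context() via _optimize_context()
    # (keys come from the code; the values shown are illustrative):
    #
    #     {
    #         "session_id": "sess-1",
    #         "user_id": "alice",
    #         "user_context": "<persona summary or ''>",
    #         "session_context": {"summary": "...", "timestamp": "..."},
    #         "interaction_contexts": [{"summary": "...", "timestamp": "..."}, ...],
    #         "combined_context": "[Session Context]\n...",
    #         "context_mode": "fresh",
    #         ...
    #     }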
    async def get_user_context(self, user_id: str) -> str:
        """
        STEP 1: Fetch or generate User Context (500-token persona summary)
        Available for all interactions except the first per user
        """
        try:
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Check whether a user context already exists
            cursor.execute("""
                SELECT persona_summary FROM user_contexts
                WHERE user_id = ?
            """, (user_id,))
            row = cursor.fetchone()

            if row and row[0]:
                # Existing user context found
                conn.close()
                logger.info(f"✓ User context loaded for {user_id}")
                return row[0]

            # Generate a new user context from all historical data
            logger.info(f"Generating new user context for {user_id}")

            # Fetch all historical session and interaction contexts for this user
            all_session_summaries = []
            all_interaction_summaries = []

            # Get all session contexts
            cursor.execute("""
                SELECT session_summary FROM session_contexts
                WHERE user_id = ?
                ORDER BY created_at DESC LIMIT 50
            """, (user_id,))
            for row in cursor.fetchall():
                if row[0]:
                    all_session_summaries.append(row[0])

            # Get all interaction contexts
            cursor.execute("""
                SELECT ic.interaction_summary
                FROM interaction_contexts ic
                JOIN sessions s ON ic.session_id = s.session_id
                WHERE s.user_id = ?
                ORDER BY ic.created_at DESC LIMIT 100
            """, (user_id,))
            for row in cursor.fetchall():
                if row[0]:
                    all_interaction_summaries.append(row[0])

            conn.close()

            if not all_session_summaries and not all_interaction_summaries:
                # First-time user - no context to generate
                logger.info(f"No historical data for {user_id} - first time user")
                return ""

            # Generate a persona summary using the LLM (500 tokens)
            historical_data = "\n\n".join(all_session_summaries + all_interaction_summaries[:20])

            if self.llm_router:
                prompt = f"""Generate a concise 500-token persona summary for user {user_id} based on their interaction history:

Historical Context:
{historical_data}

Create a persona summary that captures:
- Communication style and preferences
- Common topics and interests
- Interaction patterns
- Key information shared across sessions

Keep the summary concise and focused (approximately 500 tokens)."""

                try:
                    persona_summary = await self.llm_router.route_inference(
                        task_type="general_reasoning",
                        prompt=prompt,
                        max_tokens=500,
                        temperature=0.7
                    )

                    if persona_summary and isinstance(persona_summary, str) and persona_summary.strip():
                        # Store in the database
                        conn = sqlite3.connect(self.db_path)
                        cursor = conn.cursor()
                        cursor.execute("""
                            INSERT OR REPLACE INTO user_contexts (user_id, persona_summary, updated_at)
                            VALUES (?, ?, ?)
                        """, (user_id, persona_summary.strip(), datetime.now().isoformat()))
                        conn.commit()
                        conn.close()

                        logger.info(f"✓ Generated and stored user context for {user_id}")
                        return persona_summary.strip()
                except Exception as e:
                    logger.error(f"Error generating user context: {e}", exc_info=True)

            # Fallback: return empty if the LLM is unavailable or fails
            logger.warning(f"Could not generate user context for {user_id} - using empty")
            return ""

        except Exception as e:
            logger.error(f"Error getting user context: {e}", exc_info=True)
            return ""
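    # Summary cascade and approximate token budgets, tying get_user_context()
    # above to the generators below:
    #
    #     per turn: generate_interaction_context() -> ~50-token interaction summary
    #     per turn: generate_session_context()     -> ~100-token rollup of those summaries
    #     per user: get_user_context()             -> ~500-token persona, generated once
    #                                                 and then read from user_contexts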
""", ( interaction_id, session_id, user_input[:5000], # Increased from 500 to 5000 characters system_response[:2000], # Increased from 1000 to 2000 summary.strip(), created_at )) conn.commit() conn.close() # Update cache immediately with new interaction context # This ensures cache is synchronized with database at the same time self._update_cache_with_interaction_context(session_id, summary.strip(), created_at) logger.info(f"✓ Generated interaction context for {interaction_id} and updated cache") return summary.strip() except Exception as e: logger.error(f"Error generating interaction context: {e}", exc_info=True) # Fallback on LLM failure return "" except Exception as e: logger.error(f"Error in generate_interaction_context: {e}", exc_info=True) return "" async def generate_session_context(self, session_id: str, user_id: str = "Test_Any") -> str: """ Generate Session Context (100-token summary) at every turn Uses cached interaction contexts instead of querying database Updates both database and cache immediately """ try: # Get interaction contexts from cache (no database query) session_cache_key = f"session_{session_id}" cached_context = self.session_cache.get(session_cache_key) if not cached_context: logger.warning(f"No cached context found for session {session_id}, cannot generate session context") return "" interaction_contexts = cached_context.get('interaction_contexts', []) if not interaction_contexts: logger.info(f"No interaction contexts available for session {session_id} to summarize") return "" # Use cached interaction contexts (from cache, not database) interaction_summaries = [ic.get('summary', '') for ic in interaction_contexts if ic.get('summary')] if not interaction_summaries: logger.info(f"No interaction summaries available for session {session_id}") return "" # Generate session summary using LLM (100 tokens) if self.llm_router: combined_context = "\n".join(interaction_summaries) prompt = f"""Summarize this session's interactions in approximately 100 tokens: Interaction Summaries: {combined_context} Create a concise session summary capturing: - Main topics discussed - Key outcomes or information shared - User's focus areas Keep the summary concise (approximately 100 tokens).""" try: session_summary = await self.llm_router.route_inference( task_type="general_reasoning", prompt=prompt, max_tokens=100, temperature=0.7 ) if session_summary and isinstance(session_summary, str) and session_summary.strip(): # Store in database created_at = datetime.now().isoformat() conn = sqlite3.connect(self.db_path) cursor = conn.cursor() cursor.execute(""" INSERT OR REPLACE INTO session_contexts (session_id, user_id, session_summary, created_at) VALUES (?, ?, ?, ?) 
""", (session_id, user_id, session_summary.strip(), created_at)) conn.commit() conn.close() # Update cache immediately with new session context # This ensures cache is synchronized with database at the same time self._update_cache_with_session_context(session_id, session_summary.strip(), created_at) logger.info(f"✓ Generated session context for {session_id} and updated cache") return session_summary.strip() except Exception as e: logger.error(f"Error generating session context: {e}", exc_info=True) # Fallback on LLM failure return "" except Exception as e: logger.error(f"Error in generate_session_context: {e}", exc_info=True) return "" async def end_session(self, session_id: str, user_id: str = "Test_Any"): """ End session and clear cache Note: Session context is already generated at every turn, so this just clears cache """ try: # Session context is already generated at every turn (no need to regenerate) # Clear in-memory cache for this session (session-only key) session_cache_key = f"session_{session_id}" if session_cache_key in self.session_cache: del self.session_cache[session_cache_key] logger.info(f"✓ Cleared cache for session {session_id}") except Exception as e: logger.error(f"Error ending session: {e}", exc_info=True) def _clear_user_cache_on_change(self, session_id: str, new_user_id: str, old_user_id: str): """Clear cache entries when user changes""" if new_user_id != old_user_id: # Clear old composite cache keys old_cache_key = f"{session_id}_{old_user_id}" if old_cache_key in self.session_cache: del self.session_cache[old_cache_key] logger.info(f"Cleared old cache for user {old_user_id} on session {session_id}") def _optimize_context(self, context: dict, relevance_classification: Optional[Dict] = None) -> dict: """ Optimize context for LLM consumption with relevance filtering support Format: [Session Context] + [User Context (conditional)] + [Interaction Context #N, #N-1, ...] Args: context: Base context dictionary relevance_classification: Optional relevance classification results with dynamic user context Applies smart pruning before formatting. 
""" # Step 4: Prune context if it exceeds token limits (uses config threshold) pruned_context = self.prune_context(context) # Get context mode (fresh or relevant) session_id = pruned_context.get("session_id") context_mode = self.get_context_mode(session_id) interaction_contexts = pruned_context.get("interaction_contexts", []) session_context = pruned_context.get("session_context", {}) session_summary = session_context.get("summary", "") if isinstance(session_context, dict) else "" # MODIFIED: Conditional user context inclusion based on mode and relevance user_context = "" if context_mode == 'relevant' and relevance_classification: # Use dynamic relevant summaries from relevance classification user_context = relevance_classification.get('combined_user_context', '') if user_context: logger.info( f"Using dynamic relevant context: {len(relevance_classification.get('relevant_summaries', []))} " f"sessions summarized for session {session_id}" ) elif context_mode == 'relevant' and not relevance_classification: # Fallback: Use traditional user context if relevance classification unavailable user_context = pruned_context.get("user_context", "") logger.debug(f"Relevant mode but no classification, using traditional user context") # If context_mode == 'fresh', user_context remains empty (no user context) # Format interaction contexts as requested formatted_interactions = [] for idx, ic in enumerate(interaction_contexts[:10]): # Last 10 interactions formatted_interactions.append(f"[Interaction Context #{len(interaction_contexts) - idx}]\n{ic.get('summary', '')}") # Combine Session Context + (Conditional) User Context + Interaction Contexts combined_context = "" if session_summary: combined_context += f"[Session Context]\n{session_summary}\n\n" # Include user context only if available and in relevant mode if user_context: context_label = "[Relevant User Context]" if context_mode == 'relevant' else "[User Context]" combined_context += f"{context_label}\n{user_context}\n\n" if formatted_interactions: combined_context += "\n\n".join(formatted_interactions) return { "session_id": pruned_context.get("session_id"), "user_id": pruned_context.get("user_id", "Test_Any"), "user_context": user_context, # Dynamic summaries OR empty "session_context": session_context, "interaction_contexts": interaction_contexts, "combined_context": combined_context, "context_mode": context_mode, # Include mode for debugging "relevance_metadata": relevance_classification.get('relevance_scores', {}) if relevance_classification else {}, "preferences": pruned_context.get("preferences", {}), "active_tasks": pruned_context.get("active_tasks", []), "last_activity": pruned_context.get("last_activity") } def _get_from_memory_cache(self, cache_key: str) -> dict: """ Retrieve context from in-memory session cache with expiration check """ cached = self.session_cache.get(cache_key) if not cached: return None # Check if it's the new format with expiration if isinstance(cached, dict) and 'value' in cached: # New format with TTL if self._is_cache_expired(cached): # Remove expired cache entry del self.session_cache[cache_key] logger.debug(f"Cache expired for key: {cache_key}") return None return cached.get('value') else: # Old format (direct value) - return as-is for backward compatibility return cached def _is_cache_expired(self, cache_entry: dict) -> bool: """ Check if cache entry has expired based on TTL """ if not isinstance(cache_entry, dict): return True expires = cache_entry.get('expires') if not expires: return False # No expiration set, 
    def _is_cache_expired(self, cache_entry: dict) -> bool:
        """
        Check whether a cache entry has expired based on its TTL
        """
        if not isinstance(cache_entry, dict):
            return True

        expires = cache_entry.get('expires')
        if not expires:
            return False  # No expiration set, consider valid

        return time.time() > expires

    def add_context_cache(self, key: str, value: dict, ttl: int = 3600):
        """
        Step 2: Implement Context Caching with TTL expiration

        Add context to the cache with an expiration time.

        Args:
            key: Cache key
            value: Value to cache (dict)
            ttl: Time to live in seconds (default 3600 = 1 hour)
        """
        self.session_cache[key] = {
            'value': value,
            'expires': time.time() + ttl,
            'timestamp': time.time()
        }
        logger.debug(f"Cached context for key: {key} with TTL: {ttl}s")

    def get_token_count(self, text: str) -> int:
        """
        Approximate token count for text (4 characters ≈ 1 token)

        Args:
            text: Text to count tokens for

        Returns:
            Approximate token count
        """
        if not text:
            return 0
        # Simple approximation: 4 characters per token
        return len(text) // 4

    def prune_context(self, context: dict, max_tokens: Optional[int] = None) -> dict:
        """
        Step 4: Implement Smart Context Pruning with a configurable threshold

        Prune the context to stay within the token limit while keeping the
        most recent and relevant content.

        Args:
            context: Context dictionary to prune
            max_tokens: Maximum token count (uses the config default if None)

        Returns:
            Pruned context dictionary
        """
        # Use the config threshold if not provided
        if max_tokens is None:
            try:
                from .config import get_settings
                settings = get_settings()
                max_tokens = settings.context_pruning_threshold
                logger.debug(f"Using config pruning threshold: {max_tokens} tokens")
            except Exception:
                max_tokens = 2000  # Fallback to default
                logger.warning("Could not load config, using default pruning threshold: 2000")

        try:
            # Calculate the current token count
            current_tokens = self._calculate_context_tokens(context)
            if current_tokens <= max_tokens:
                return context  # No pruning needed

            logger.info(f"Context token count ({current_tokens}) exceeds limit ({max_tokens}), pruning...")

            # Create a copy to avoid modifying the original
            pruned_context = context.copy()

            # Priority: keep the most recent interactions + session context + user context
            interaction_contexts = pruned_context.get('interaction_contexts', [])
            session_context = pruned_context.get('session_context', {})
            user_context = pruned_context.get('user_context', '')

            # Keep user context and session context (essential)
            essential_tokens = (
                self.get_token_count(user_context) +
                self.get_token_count(str(session_context))
            )

            # Calculate how many interaction contexts we can keep
            available_tokens = max_tokens - essential_tokens

            if available_tokens < 0:
                # The essential context itself is too large - truncate the user context
                if self.get_token_count(user_context) > max_tokens // 2:
                    # Rough cut: max_tokens * 2 characters ≈ max_tokens / 2 tokens
                    # under the 4-chars-per-token heuristic
                    pruned_context['user_context'] = user_context[:max_tokens * 2]
                    logger.warning("User context too large, truncated")
                return pruned_context

            # Keep the most recent interactions that fit in the token budget
            kept_interactions = []
            current_size = 0
            for interaction in interaction_contexts:
                summary = interaction.get('summary', '')
                interaction_tokens = self.get_token_count(summary)
                if current_size + interaction_tokens <= available_tokens:
                    kept_interactions.append(interaction)
                    current_size += interaction_tokens
                else:
                    break  # Can't fit any more

            pruned_context['interaction_contexts'] = kept_interactions

            logger.info(f"Pruned context: kept {len(kept_interactions)}/{len(interaction_contexts)} "
                        f"interactions, reduced from {current_tokens} to "
                        f"{self._calculate_context_tokens(pruned_context)} tokens")

            return pruned_context

        except Exception as e:
            logger.error(f"Error pruning context: {e}", exc_info=True)
            return context  # Return the original on error
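    # Worked example of the pruning budget (illustrative numbers, using the
    # 4-chars-per-token heuristic from get_token_count()):
    #
    #     max_tokens = 2000
    #     user_context    = 2400 chars -> ~600 tokens }  essential: ~700 tokens
    #     session summary =  400 chars -> ~100 tokens }
    #     remaining budget for interaction summaries: ~1300 tokens,
    #     filled most-recent-first until the next summary would overflow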
total token count for context""" total = 0 # Count tokens in each component user_context = context.get('user_context', '') total += self.get_token_count(str(user_context)) session_context = context.get('session_context', {}) if isinstance(session_context, dict): total += self.get_token_count(str(session_context.get('summary', ''))) else: total += self.get_token_count(str(session_context)) interaction_contexts = context.get('interaction_contexts', []) for interaction in interaction_contexts: summary = interaction.get('summary', '') total += self.get_token_count(str(summary)) return total async def _retrieve_from_db(self, session_id: str, user_input: str, user_id: str = "Test_Any") -> dict: """ Retrieve session context with proper user_id synchronization Uses transactions to ensure atomic updates of database and cache """ conn = None try: conn = sqlite3.connect(self.db_path) cursor = conn.cursor() # Use transaction to ensure atomic updates cursor.execute("BEGIN TRANSACTION") # Get session data (SQLite doesn't support FOR UPDATE, but transaction ensures consistency) cursor.execute(""" SELECT context_data, user_metadata, last_activity, user_id FROM sessions WHERE session_id = ? """, (session_id,)) row = cursor.fetchone() if row: context_data = json.loads(row[0]) if row[0] else {} user_metadata = json.loads(row[1]) if row[1] else {} last_activity = row[2] session_user_id = row[3] if len(row) > 3 else user_id # Check for user_id change and update atomically user_changed = False if session_user_id != user_id: logger.info(f"User change detected: {session_user_id} -> {user_id} for session {session_id}") user_changed = True # Update session with new user_id cursor.execute(""" UPDATE sessions SET user_id = ?, last_activity = ? WHERE session_id = ? """, (user_id, datetime.now().isoformat(), session_id)) # Clear any cached interaction contexts for old user by marking for refresh try: cursor.execute(""" UPDATE interaction_contexts SET needs_refresh = 1 WHERE session_id = ? """, (session_id,)) except sqlite3.OperationalError: # Column might not exist yet, will be created by schema update pass # Log user change event try: cursor.execute(""" INSERT INTO user_change_log (session_id, old_user_id, new_user_id, timestamp) VALUES (?, ?, ?, ?) """, (session_id, session_user_id, user_id, datetime.now().isoformat())) except sqlite3.OperationalError: # Table might not exist yet, will be created by schema update pass # Clear old cache entries when user changes self._clear_user_cache_on_change(session_id, user_id, session_user_id) cursor.execute("COMMIT") # Get interaction contexts with refresh flag check try: cursor.execute(""" SELECT interaction_summary, created_at, needs_refresh FROM interaction_contexts WHERE session_id = ? AND (needs_refresh IS NULL OR needs_refresh = 0) ORDER BY created_at DESC LIMIT 20 """, (session_id,)) except sqlite3.OperationalError: # Column might not exist yet, fall back to query without needs_refresh cursor.execute(""" SELECT interaction_summary, created_at FROM interaction_contexts WHERE session_id = ? 
                        ORDER BY created_at DESC LIMIT 20
                    """, (session_id,))

                interaction_contexts = []
                for ic_row in cursor.fetchall():
                    # Handle both query formats (with and without needs_refresh)
                    if len(ic_row) >= 2:
                        summary = ic_row[0]
                        timestamp = ic_row[1]
                        needs_refresh = ic_row[2] if len(ic_row) > 2 else 0
                        if summary and not needs_refresh:
                            interaction_contexts.append({
                                "summary": summary,
                                "timestamp": timestamp
                            })

                # Get the session context from the database
                session_context_data = None
                try:
                    cursor.execute("""
                        SELECT session_summary, created_at
                        FROM session_contexts
                        WHERE session_id = ?
                        ORDER BY created_at DESC LIMIT 1
                    """, (session_id,))
                    sc_row = cursor.fetchone()
                    if sc_row and sc_row[0]:
                        session_context_data = {
                            "summary": sc_row[0],
                            "timestamp": sc_row[1]
                        }
                except sqlite3.OperationalError:
                    # Table might not exist yet
                    pass

                context = {
                    "session_id": session_id,
                    "user_id": user_id,
                    "interaction_contexts": interaction_contexts,
                    "session_context": session_context_data,
                    "preferences": user_metadata.get("preferences", {}),
                    "active_tasks": user_metadata.get("active_tasks", []),
                    "last_activity": last_activity,
                    "user_context_loaded": False,
                    "user_changed": user_changed
                }

                conn.close()
                return context
            else:
                # Create a new session within the transaction
                cursor.execute("""
                    INSERT INTO sessions (session_id, user_id, created_at, last_activity,
                                          context_data, user_metadata)
                    VALUES (?, ?, ?, ?, ?, ?)
                """, (session_id, user_id, datetime.now().isoformat(),
                      datetime.now().isoformat(), "{}", "{}"))
                cursor.execute("COMMIT")
                conn.close()

                return {
                    "session_id": session_id,
                    "user_id": user_id,
                    "interaction_contexts": [],
                    "session_context": None,
                    "preferences": {},
                    "active_tasks": [],
                    "user_context_loaded": False,
                    "user_changed": False
                }

        except sqlite3.Error as e:
            logger.error(f"Database transaction error: {e}", exc_info=True)
            if conn:
                try:
                    conn.rollback()
                except Exception:
                    pass
                conn.close()
            # Return a safe fallback
            return {
                "session_id": session_id,
                "user_id": user_id,
                "interaction_contexts": [],
                "session_context": None,
                "preferences": {},
                "active_tasks": [],
                "user_context_loaded": False,
                "error": str(e),
                "user_changed": False
            }
        except Exception as e:
            logger.error(f"Database retrieval error: {e}", exc_info=True)
            if conn:
                try:
                    conn.rollback()
                except Exception:
                    pass
                conn.close()
            # Return a safe fallback
            return {
                "session_id": session_id,
                "user_id": user_id,
                "interaction_contexts": [],
                "session_context": None,
                "preferences": {},
                "active_tasks": [],
                "user_context_loaded": False,
                "error": str(e),
                "user_changed": False
            }

    def _warm_memory_cache(self, cache_key: str, context: dict):
        """
        Warm the in-memory cache with retrieved context
        Note: use add_context_cache() directly for explicit TTL control
        """
        # Use add_context_cache for consistency with TTL
        self.add_context_cache(cache_key, context, ttl=self.cache_config.get("ttl", 3600))
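    # Write-through cache synchronization: the two helpers below mirror every
    # summary written to SQLite into the in-memory session cache, so later
    # turns can read interaction/session summaries without a database round trip.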
    def _update_cache_with_interaction_context(self, session_id: str,
                                               interaction_summary: str, created_at: str):
        """
        Update the cache with a new interaction context immediately after the
        database update. This keeps the cache synchronized with the database
        without requiring database queries.
        """
        session_cache_key = f"session_{session_id}"

        # Get the current cached context if it exists, unwrapping the TTL-aware
        # format where necessary (mutating the wrapped value in place keeps the
        # TTL metadata intact)
        entry = self.session_cache.get(session_cache_key)
        if isinstance(entry, dict) and 'value' in entry:
            cached_context = entry['value']
        else:
            cached_context = entry

        if cached_context:
            # Add the new interaction context to the beginning of the list (most recent first)
            interaction_contexts = cached_context.get('interaction_contexts', [])
            new_interaction = {
                "summary": interaction_summary,
                "timestamp": created_at
            }

            # Insert at the beginning and keep only the last 20 (matches the DB query limit)
            interaction_contexts.insert(0, new_interaction)
            interaction_contexts = interaction_contexts[:20]

            # Update the cached context with the new interaction contexts
            cached_context['interaction_contexts'] = interaction_contexts
            logger.debug(f"Cache updated with new interaction context for session {session_id} "
                         f"(total: {len(interaction_contexts)})")
        else:
            # If no cache entry exists, create a new one
            new_context = {
                "session_id": session_id,
                "interaction_contexts": [{
                    "summary": interaction_summary,
                    "timestamp": created_at
                }],
                "preferences": {},
                "active_tasks": [],
                "user_context_loaded": False
            }
            self.session_cache[session_cache_key] = new_context
            logger.debug(f"Created new cache entry with interaction context for session {session_id}")

    def _update_cache_with_session_context(self, session_id: str, session_summary: str,
                                           created_at: str):
        """
        Update the cache with a new session context immediately after the
        database update. This keeps the cache synchronized with the database
        without requiring database queries.
        """
        session_cache_key = f"session_{session_id}"

        # Get the current cached context, unwrapping the TTL-aware format
        entry = self.session_cache.get(session_cache_key)
        if isinstance(entry, dict) and 'value' in entry:
            cached_context = entry['value']
        else:
            cached_context = entry

        if cached_context:
            # Update the session context in the cache (in place)
            cached_context['session_context'] = {
                "summary": session_summary,
                "timestamp": created_at
            }
            logger.debug(f"Cache updated with new session context for session {session_id}")
        else:
            # If no cache entry exists, create a new one
            new_context = {
                "session_id": session_id,
                "session_context": {
                    "summary": session_summary,
                    "timestamp": created_at
                },
                "interaction_contexts": [],
                "preferences": {},
                "active_tasks": [],
                "user_context_loaded": False
            }
            self.session_cache[session_cache_key] = new_context
            logger.debug(f"Created new cache entry with session context for session {session_id}")
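    # Deduplication scheme used by _update_context() and its helpers below:
    # the key is sha256("{session_id}:{user_id}:{stripped user_input}"). It is
    # checked against an in-memory set first, then against
    # interactions.interaction_hash (which carries a unique index), and rows
    # are written with INSERT OR IGNORE so replays are no-ops.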
""", ( interaction_hash, context["session_id"], user_input, json.dumps(session_context), current_time )) # Mark interaction as processed (outside transaction) self._mark_interaction_processed(interaction_hash) # Update in-memory context context["last_interaction"] = user_input context["last_update"] = current_time logger.info(f"Context updated for session {context['session_id']} with hash {interaction_hash[:8]}") return context except Exception as e: logger.error(f"Error updating context: {e}", exc_info=True) return context def _generate_interaction_hash(self, user_input: str, session_id: str, user_id: str) -> str: """Generate unique hash for interaction to prevent duplicates""" # Use session_id, user_id, and user_input for exact duplicate detection # Normalize user input by stripping whitespace normalized_input = user_input.strip() content = f"{session_id}:{user_id}:{normalized_input}" return hashlib.sha256(content.encode()).hexdigest() def _is_duplicate_interaction(self, interaction_hash: str) -> bool: """Check if interaction was already processed""" # Keep a rolling window of recent interaction hashes in memory if not hasattr(self, '_processed_interactions'): self._processed_interactions = set() # Check in-memory cache first if interaction_hash in self._processed_interactions: return True # Also check database for persistent duplicates try: conn = sqlite3.connect(self.db_path) cursor = conn.cursor() # Check if interaction_hash column exists and query for duplicates cursor.execute("PRAGMA table_info(interactions)") columns = [row[1] for row in cursor.fetchall()] if 'interaction_hash' in columns: cursor.execute(""" SELECT COUNT(*) FROM interactions WHERE interaction_hash IS NOT NULL AND interaction_hash = ? """, (interaction_hash,)) count = cursor.fetchone()[0] conn.close() return count > 0 else: conn.close() return False except sqlite3.OperationalError: # Column might not exist yet, only check in-memory return interaction_hash in self._processed_interactions def _mark_interaction_processed(self, interaction_hash: str): """Mark interaction as processed""" if not hasattr(self, '_processed_interactions'): self._processed_interactions = set() self._processed_interactions.add(interaction_hash) # Limit memory usage by keeping only last 1000 hashes if len(self._processed_interactions) > 1000: # Keep most recent 500 entries (simple truncation) self._processed_interactions = set(list(self._processed_interactions)[-500:]) async def manage_context_optimized(self, session_id: str, user_input: str, user_id: str = "Test_Any") -> dict: """ Efficient context management with transaction optimization """ # Use session-only cache key session_cache_key = f"session_{session_id}" # Try to get from cache first (no DB access) cached_context = self._get_from_memory_cache(session_cache_key) if cached_context and self._is_cache_valid(cached_context): logger.debug(f"Using cached context for session {session_id}") return cached_context # Use transaction for all DB operations with self.transaction_manager.transaction(session_id) as cursor: # Atomic session retrieval and update cursor.execute(""" SELECT s.context_data, s.user_metadata, s.last_activity, s.user_id, COUNT(ic.interaction_id) as interaction_count FROM sessions s LEFT JOIN interaction_contexts ic ON s.session_id = ic.session_id WHERE s.session_id = ? 
    async def manage_context_optimized(self, session_id: str, user_input: str,
                                       user_id: str = "Test_Any") -> dict:
        """
        Efficient context management with transaction optimization
        """
        # Use a session-only cache key
        session_cache_key = f"session_{session_id}"

        # Try to get from the cache first (no DB access)
        cached_context = self._get_from_memory_cache(session_cache_key)
        if cached_context and self._is_cache_valid(cached_context):
            logger.debug(f"Using cached context for session {session_id}")
            return cached_context

        # Use a transaction for all DB operations
        with self.transaction_manager.transaction(session_id) as cursor:
            # Atomic session retrieval and update
            cursor.execute("""
                SELECT s.context_data, s.user_metadata, s.last_activity, s.user_id,
                       COUNT(ic.interaction_id) AS interaction_count
                FROM sessions s
                LEFT JOIN interaction_contexts ic ON s.session_id = ic.session_id
                WHERE s.session_id = ?
                GROUP BY s.session_id
            """, (session_id,))
            row = cursor.fetchone()

            if row:
                # Parse existing session data
                context_data = json.loads(row[0] or '{}')
                user_metadata = json.loads(row[1] or '{}')
                last_activity = row[2]
                stored_user_id = row[3] or user_id
                interaction_count = row[4] or 0

                # Handle user change atomically
                if stored_user_id != user_id:
                    self._handle_user_change_atomic(cursor, session_id, stored_user_id, user_id)

                # Get interaction contexts efficiently
                interaction_contexts = self._get_interaction_contexts_atomic(cursor, session_id)
            else:
                # Create a new session atomically
                cursor.execute("""
                    INSERT INTO sessions (session_id, user_id, created_at, last_activity,
                                          context_data, user_metadata)
                    VALUES (?, ?, datetime('now'), datetime('now'), '{}', '{}')
                """, (session_id, user_id))
                context_data = {}
                user_metadata = {}
                interaction_contexts = []
                interaction_count = 0

        # Load user context asynchronously (outside the transaction)
        user_context = await self._load_user_context_async(user_id)

        # Build the final context
        final_context = {
            "session_id": session_id,
            "user_id": user_id,
            "interaction_contexts": interaction_contexts,
            "user_context": user_context,
            "preferences": user_metadata.get("preferences", {}),
            "active_tasks": user_metadata.get("active_tasks", []),
            "interaction_count": interaction_count,
            "cache_timestamp": datetime.now().isoformat()
        }

        # Update the cache
        self._warm_memory_cache(session_cache_key, final_context)

        return self._optimize_context(final_context)

    def _handle_user_change_atomic(self, cursor, session_id: str, old_user_id: str,
                                   new_user_id: str):
        """Handle a user change within a transaction"""
        logger.info(f"Handling user change in transaction: {old_user_id} -> {new_user_id}")

        # Update the session
        cursor.execute("""
            UPDATE sessions
            SET user_id = ?, last_activity = datetime('now')
            WHERE session_id = ?
        """, (new_user_id, session_id))

        # Log the change
        try:
            cursor.execute("""
                INSERT INTO user_change_log (session_id, old_user_id, new_user_id, timestamp)
                VALUES (?, ?, ?, datetime('now'))
            """, (session_id, old_user_id, new_user_id))
        except sqlite3.OperationalError:
            # Table might not exist yet
            pass

        # Invalidate related caches
        try:
            cursor.execute("""
                UPDATE interaction_contexts
                SET needs_refresh = 1
                WHERE session_id = ?
            """, (session_id,))
        except sqlite3.OperationalError:
            # Column might not exist yet
            pass

    def _get_interaction_contexts_atomic(self, cursor, session_id: str, limit: int = 20):
        """Get interaction contexts within a transaction"""
        try:
            cursor.execute("""
                SELECT interaction_summary, created_at, interaction_id
                FROM interaction_contexts
                WHERE session_id = ? AND (needs_refresh IS NULL OR needs_refresh = 0)
                ORDER BY created_at DESC LIMIT ?
            """, (session_id, limit))
        except sqlite3.OperationalError:
            # Fallback if the needs_refresh column doesn't exist
            cursor.execute("""
                SELECT interaction_summary, created_at, interaction_id
                FROM interaction_contexts
                WHERE session_id = ?
                ORDER BY created_at DESC LIMIT ?
""", (session_id, limit)) contexts = [] for row in cursor.fetchall(): if row[0]: contexts.append({ "summary": row[0], "timestamp": row[1], "id": row[2] if len(row) > 2 else None }) return contexts async def _load_user_context_async(self, user_id: str): """Load user context asynchronously to avoid blocking""" try: # Check memory cache first user_cache_key = f"user_{user_id}" cached = self._get_from_memory_cache(user_cache_key) if cached: return cached.get("user_context", "") # Load from database return await self.get_user_context(user_id) except Exception as e: logger.error(f"Error loading user context: {e}") return "" def _is_cache_valid(self, cached_context: dict, max_age_seconds: int = 60) -> bool: """Check if cached context is still valid""" if not cached_context: return False cache_timestamp = cached_context.get("cache_timestamp") if not cache_timestamp: return False try: cache_time = datetime.fromisoformat(cache_timestamp) age = (datetime.now() - cache_time).total_seconds() return age < max_age_seconds except: return False def invalidate_session_cache(self, session_id: str): """ Invalidate cached context for a session to force fresh retrieval Only affects cache management - does not change application functionality """ session_cache_key = f"session_{session_id}" if session_cache_key in self.session_cache: del self.session_cache[session_cache_key] logger.info(f"Cache invalidated for session {session_id} to ensure fresh context retrieval") def optimize_database_indexes(self): """Create database indexes for better query performance""" try: conn = sqlite3.connect(self.db_path) cursor = conn.cursor() # Create indexes for frequently queried columns indexes = [ "CREATE INDEX IF NOT EXISTS idx_sessions_user_id ON sessions(user_id)", "CREATE INDEX IF NOT EXISTS idx_sessions_last_activity ON sessions(last_activity)", "CREATE INDEX IF NOT EXISTS idx_interactions_session_id ON interactions(session_id)", "CREATE INDEX IF NOT EXISTS idx_interaction_contexts_session_id ON interaction_contexts(session_id)", "CREATE INDEX IF NOT EXISTS idx_interaction_contexts_created_at ON interaction_contexts(created_at)", "CREATE INDEX IF NOT EXISTS idx_user_change_log_session_id ON user_change_log(session_id)", "CREATE INDEX IF NOT EXISTS idx_user_contexts_updated_at ON user_contexts(updated_at)" ] for index in indexes: try: cursor.execute(index) except sqlite3.OperationalError as e: # Table might not exist yet, skip this index logger.debug(f"Skipping index creation (table may not exist): {e}") # Analyze database for query optimization try: cursor.execute("ANALYZE") except sqlite3.OperationalError: # ANALYZE might not be available in all SQLite versions pass conn.commit() conn.close() logger.info("✓ Database indexes optimized successfully") except Exception as e: logger.error(f"Error optimizing database indexes: {e}", exc_info=True) def set_context_mode(self, session_id: str, mode: str, user_id: str = "Test_Any"): """ Set context mode for session (fresh or relevant) Args: session_id: Session identifier mode: 'fresh' (no user context) or 'relevant' (only relevant context) user_id: User identifier Returns: bool: True if successful, False otherwise """ try: import time # VALIDATION: Ensure mode is valid if mode not in ['fresh', 'relevant']: logger.warning(f"Invalid context mode '{mode}', defaulting to 'fresh'") mode = 'fresh' # Get or create cache entry cache_key = f"session_{session_id}" cached_context = self._get_from_memory_cache(cache_key) if not cached_context: cached_context = { 'session_id': session_id, 
    def set_context_mode(self, session_id: str, mode: str, user_id: str = "Test_Any"):
        """
        Set the context mode for a session (fresh or relevant)

        Args:
            session_id: Session identifier
            mode: 'fresh' (no user context) or 'relevant' (only relevant context)
            user_id: User identifier

        Returns:
            bool: True if successful, False otherwise
        """
        try:
            # VALIDATION: ensure the mode is valid
            if mode not in ['fresh', 'relevant']:
                logger.warning(f"Invalid context mode '{mode}', defaulting to 'fresh'")
                mode = 'fresh'

            # Get or create the cache entry
            cache_key = f"session_{session_id}"
            cached_context = self._get_from_memory_cache(cache_key)

            if not cached_context:
                cached_context = {
                    'session_id': session_id,
                    'user_id': user_id,
                    'preferences': {},
                    'context_mode': mode,
                    'context_mode_timestamp': time.time()
                }
            else:
                # Update the existing context (preserve other data)
                cached_context['context_mode'] = mode
                cached_context['context_mode_timestamp'] = time.time()
                cached_context['user_id'] = user_id  # Update user_id if changed

            # Update the cache with TTL
            self.add_context_cache(cache_key, cached_context, ttl=3600)

            logger.info(f"Context mode set to '{mode}' for session {session_id} (user: {user_id})")
            return True

        except Exception as e:
            logger.error(f"Error setting context mode: {e}", exc_info=True)
            return False  # Failure doesn't break the existing flow

    def get_context_mode(self, session_id: str) -> str:
        """
        Get the current context mode for a session

        Args:
            session_id: Session identifier

        Returns:
            str: 'fresh' or 'relevant' (default: 'fresh')
        """
        try:
            cache_key = f"session_{session_id}"
            cached_context = self._get_from_memory_cache(cache_key)

            if cached_context:
                mode = cached_context.get('context_mode', 'fresh')
                # VALIDATION: ensure the cached mode is still valid
                if mode in ['fresh', 'relevant']:
                    return mode
                else:
                    logger.warning(f"Invalid cached mode '{mode}', resetting to 'fresh'")
                    cached_context['context_mode'] = 'fresh'
                    cached_context['context_mode_timestamp'] = time.time()
                    self.add_context_cache(cache_key, cached_context, ttl=3600)
                    return 'fresh'

            # Default for new sessions
            return 'fresh'

        except Exception as e:
            logger.error(f"Error getting context mode: {e}", exc_info=True)
            return 'fresh'  # Safe default - no degradation
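    # Shape of each element returned by get_all_user_sessions() below
    # (illustrative values):
    #
    #     {
    #         "session_id": "sess-1",
    #         "summary": "<~100-token session summary>",
    #         "created_at": "<ISO timestamp>",
    #         "interaction_contexts": [{"summary": "...", "timestamp": "..."}, ...],
    #     }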
    async def get_all_user_sessions(self, user_id: str) -> List[Dict]:
        """
        Fetch all session contexts for a user (for relevance classification)
        Performance: single database query with a JOIN

        Args:
            user_id: User identifier

        Returns:
            List of session context dictionaries with summaries and interactions
        """
        try:
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Fetch all session contexts for the user with interaction summaries.
            # The inner SELECT limits the aggregation to the 10 most recent
            # interactions per session (an ORDER BY/LIMIT placed directly in a
            # bare aggregate subquery would not restrict its input rows).
            cursor.execute("""
                SELECT DISTINCT
                    sc.session_id,
                    sc.session_summary,
                    sc.created_at,
                    (SELECT GROUP_CONCAT(recent.interaction_summary, ' ||| ')
                     FROM (SELECT ic.interaction_summary
                           FROM interaction_contexts ic
                           WHERE ic.session_id = sc.session_id
                           ORDER BY ic.created_at DESC
                           LIMIT 10) AS recent) AS recent_interactions
                FROM session_contexts sc
                JOIN sessions s ON sc.session_id = s.session_id
                WHERE s.user_id = ?
                ORDER BY sc.created_at DESC LIMIT 50
            """, (user_id,))

            sessions = []
            for row in cursor.fetchall():
                session_id, session_summary, created_at, interactions_str = row

                # Parse interaction summaries
                interaction_list = []
                if interactions_str:
                    for summary in interactions_str.split(' ||| '):
                        if summary.strip():
                            interaction_list.append({
                                'summary': summary.strip(),
                                'timestamp': created_at
                            })

                sessions.append({
                    'session_id': session_id,
                    'summary': session_summary or '',
                    'created_at': created_at,
                    'interaction_contexts': interaction_list
                })

            conn.close()
            logger.info(f"Fetched {len(sessions)} sessions for user {user_id}")
            return sessions

        except Exception as e:
            logger.error(f"Error fetching user sessions: {e}", exc_info=True)
            return []  # Safe fallback - no degradation

    def _extract_entities(self, context: dict) -> list:
        """
        Extract essential entities from context
        """
        # TODO: Implement entity extraction
        return []

    def _generate_summary(self, context: dict) -> str:
        """
        Generate conversation summary
        """
        # TODO: Implement summary generation
        return ""

    def get_or_create_session_context(self, session_id: str, user_id: Optional[str] = None) -> Dict:
        """Enhanced context retrieval with caching"""
        # In-memory cache check first
        if session_id in self._session_cache:
            cache_entry = self._session_cache[session_id]
            if time.time() - cache_entry['timestamp'] < 300:  # 5-minute cache
                logger.debug(f"Cache hit for session {session_id}")
                return cache_entry['context']

        # Batch database queries
        conn = None
        try:
            conn = sqlite3.connect(self.db_path)
            cursor = conn.cursor()

            # Single query for all context data
            query = """
                SELECT s.context_data, s.user_metadata, s.last_activity,
                       u.persona_summary, ic.interaction_summary
                FROM sessions s
                LEFT JOIN user_contexts u ON s.user_id = u.user_id
                LEFT JOIN interaction_contexts ic ON s.session_id = ic.session_id
                WHERE s.session_id = ?
                ORDER BY ic.created_at DESC LIMIT 10
            """
            cursor.execute(query, (session_id,))
            results = cursor.fetchall()

            # Process results efficiently
            context = self._build_context_from_results(results, session_id, user_id)

            # Update the cache
            self._session_cache[session_id] = {
                'context': context,
                'timestamp': time.time()
            }

            return context

        except Exception as e:
            logger.error(f"Error in get_or_create_session_context: {e}", exc_info=True)
            # Return a safe fallback
            return {
                "session_id": session_id,
                "user_id": user_id or "Test_Any",
                "interaction_contexts": [],
                "session_context": None,
                "preferences": {},
                "active_tasks": [],
                "user_context_loaded": False
            }
        finally:
            if conn:
                conn.close()

    def _build_context_from_results(self, results: list, session_id: str,
                                    user_id: Optional[str]) -> Dict:
        """Build a context dictionary from batch query results"""
        context = {
            "session_id": session_id,
            "user_id": user_id or "Test_Any",
            "interaction_contexts": [],
            "session_context": None,
            "user_context": "",
            "preferences": {},
            "active_tasks": [],
            "user_context_loaded": False
        }

        if not results:
            return context

        # Process the first row for session data
        first_row = results[0]
        if first_row[0]:  # context_data
            try:
                session_data = json.loads(first_row[0])
                context["preferences"] = session_data.get("preferences", {})
                context["active_tasks"] = session_data.get("active_tasks", [])
            except Exception:
                pass

        if first_row[1]:  # user_metadata
            try:
                user_metadata = json.loads(first_row[1])
                context["preferences"].update(user_metadata.get("preferences", {}))
            except Exception:
                pass

        context["last_activity"] = first_row[2]  # last_activity

        if first_row[3]:  # persona_summary
            context["user_context"] = first_row[3]
            context["user_context_loaded"] = True

        # Process interaction contexts
        seen_interactions = set()
        for row in results:
            if row[4]:  # interaction_summary
                # Deduplicate interactions
                if row[4] not in seen_interactions:
                    seen_interactions.add(row[4])
                    context["interaction_contexts"].append({
                        "summary": row[4],
                        "timestamp": None  # Could extract from the row if available
                    })

        return context
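

if __name__ == "__main__":
    # Minimal smoke test (illustrative only, not part of the public API).
    # Assumes no LLM router is available, so every summary-generation path
    # degrades gracefully to an empty string; the database path is a
    # throwaway file chosen for this demo.
    import asyncio

    async def _demo():
        mgr = EfficientContextManager(llm_router=None, db_path="/tmp/demo_sessions.db")
        ctx = await mgr.manage_context("demo-session", "Hello there", user_id="demo-user")
        print("combined_context:", repr(ctx["combined_context"]))
        await mgr.end_session("demo-session", "demo-user")

    asyncio.run(_demo())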