Spaces:

JatinAutonomousLabs
/

Research_AI_Assistant

Sleeping

JatsTheAIGen committed on Nov 7

Commit

fad63bf

1 Parent(s): f5d3311

feat: Add comprehensive step-by-step system readiness logging

- Add detailed 7-step startup process in main.py with component verification
- Enhance orchestration initialization with 6-step process and health checks
- Add step-by-step logging for Flask API initialization
- Include component status summaries and service endpoint information
- Add final 'SYSTEM READY' confirmation after all components initialized
- Improve container log readability with clear step indicators and status icons
- Log configuration details (ZeroGPU, local models, database paths)
- Add component health verification before marking system as ready

Files changed (4) hide show

app.py +89 -13
flask_api.py +14 -3
flask_api_standalone.py +29 -7
main.py +103 -22

app.py CHANGED Viewed

@@ -2068,37 +2068,113 @@ def initialize_orchestrator():
             logger.debug(f"Could not load ZeroGPU config: {e}")
         # Initialize LLM Router
-        logger.info("Step 1/6: Initializing LLM Router...")
         llm_router = LLMRouter(hf_token, use_local_models=True, zero_gpu_config=zero_gpu_config)
-        logger.info("✓ LLM Router initialized")
         # Initialize Agents
-        logger.info("Step 2/6: Initializing Agents...")
         agents = {
             'intent_recognition': create_intent_agent(llm_router),
-            'response_synthesis': create_synthesis_agent(llm_router),
-            'safety_check': create_safety_agent(llm_router),
         }
-        # Add skills identification agent
         skills_agent = create_skills_identification_agent(llm_router)
         agents['skills_identification'] = skills_agent
-        logger.info("✓ Skills identification agent initialized")
-        logger.info(f"✓ Initialized {len(agents)} agents")
         # Initialize Context Manager (with LLM router for context generation)
-        logger.info("Step 3/6: Initializing Context Manager...")
         context_manager = EfficientContextManager(llm_router=llm_router)
-        logger.info("✓ Context Manager initialized")
         # Initialize Orchestrator
-        logger.info("Step 4/6: Initializing Orchestrator...")
         orchestrator = MVPOrchestrator(llm_router, context_manager, agents)
-        logger.info("✓ Orchestrator initialized")
         logger.info("=" * 60)
-        logger.info("ORCHESTRATION SYSTEM READY")
         logger.info("=" * 60)
     except Exception as e:

             logger.debug(f"Could not load ZeroGPU config: {e}")
         # Initialize LLM Router
+        logger.info("[ORCHESTRATION STEP 1/6] Initializing LLM Router...")
+        logger.info("  → Checking inference backend configuration...")
+        if zero_gpu_config and zero_gpu_config.get("enabled"):
+            logger.info(f"  → ZeroGPU API: {zero_gpu_config.get('base_url', 'N/A')}")
+            if zero_gpu_config.get("per_user_mode"):
+                logger.info("  → Mode: Per-user (multi-tenant)")
+            else:
+                logger.info("  → Mode: Service account (single-tenant)")
+        else:
+            logger.info("  → ZeroGPU API: Disabled (using local/HF fallback)")
+        logger.info("  → Local models: Enabled (lazy loading)")
         llm_router = LLMRouter(hf_token, use_local_models=True, zero_gpu_config=zero_gpu_config)
+        logger.info("  ✓ LLM Router initialized")
+        logger.info("  ✓ Inference routing configured")
         # Initialize Agents
+        logger.info("[ORCHESTRATION STEP 2/6] Initializing AI Agents...")
+        logger.info("  → Creating intent recognition agent...")
         agents = {
             'intent_recognition': create_intent_agent(llm_router),
         }
+        logger.info("  ✓ Intent recognition agent ready")
+        logger.info("  → Creating response synthesis agent...")
+        agents['response_synthesis'] = create_synthesis_agent(llm_router)
+        logger.info("  ✓ Response synthesis agent ready")
+        logger.info("  → Creating safety check agent...")
+        agents['safety_check'] = create_safety_agent(llm_router)
+        logger.info("  ✓ Safety check agent ready")
+        logger.info("  → Creating skills identification agent...")
         skills_agent = create_skills_identification_agent(llm_router)
         agents['skills_identification'] = skills_agent
+        logger.info("  ✓ Skills identification agent ready")
+        logger.info(f"  ✓ All {len(agents)} agents initialized successfully")
         # Initialize Context Manager (with LLM router for context generation)
+        logger.info("[ORCHESTRATION STEP 3/6] Initializing Context Manager...")
+        logger.info("  → Setting up session database...")
+        logger.info(f"  → Database path: {settings.db_path if hasattr(settings, 'db_path') else '/tmp/sessions.db'}")
         context_manager = EfficientContextManager(llm_router=llm_router)
+        logger.info("  ✓ Context Manager initialized")
+        logger.info("  ✓ Session storage ready")
         # Initialize Orchestrator
+        logger.info("[ORCHESTRATION STEP 4/6] Initializing Orchestrator...")
+        logger.info("  → Connecting LLM Router, Context Manager, and Agents...")
         orchestrator = MVPOrchestrator(llm_router, context_manager, agents)
+        logger.info("  ✓ Orchestrator initialized")
+        logger.info("  ✓ Request processing pipeline ready")
+        # Component Health Verification
+        logger.info("[ORCHESTRATION STEP 5/6] Verifying component health...")
+        health_status = {}
+        # Check LLM Router
+        if llm_router:
+            health_status['LLM Router'] = True
+            logger.info("  ✓ LLM Router: Healthy")
+        else:
+            health_status['LLM Router'] = False
+            logger.error("  ✗ LLM Router: Not available")
+        # Check Agents
+        if agents and len(agents) == 4:
+            health_status['Agents'] = True
+            logger.info(f"  ✓ Agents: All {len(agents)} agents healthy")
+        else:
+            health_status['Agents'] = False
+            logger.error(f"  ✗ Agents: Only {len(agents) if agents else 0} agents available")
+        # Check Context Manager
+        if context_manager:
+            health_status['Context Manager'] = True
+            logger.info("  ✓ Context Manager: Healthy")
+        else:
+            health_status['Context Manager'] = False
+            logger.error("  ✗ Context Manager: Not available")
+        # Check Orchestrator
+        if orchestrator:
+            health_status['Orchestrator'] = True
+            logger.info("  ✓ Orchestrator: Healthy")
+        else:
+            health_status['Orchestrator'] = False
+            logger.error("  ✗ Orchestrator: Not available")
+        logger.info("  ✓ Component health verification complete")
+        # Final Readiness Confirmation
+        logger.info("[ORCHESTRATION STEP 6/6] Final readiness confirmation...")
+        all_healthy = all(health_status.values())
+        if all_healthy:
+            logger.info("  ✓ All components healthy")
+        else:
+            failed_components = [comp for comp, status in health_status.items() if not status]
+            logger.warning(f"  ⚠ Some components not healthy: {', '.join(failed_components)}")
+        logger.info("=" * 60)
+        logger.info("✅ ORCHESTRATION SYSTEM READY")
         logger.info("=" * 60)
+        logger.info("Component Status Summary:")
+        for component, status in health_status.items():
+            status_icon = "✓" if status else "✗"
+            logger.info(f"  {status_icon} {component}: {'Ready' if status else 'Not Available'}")
         logger.info("=" * 60)
     except Exception as e:

flask_api.py CHANGED Viewed

@@ -43,6 +43,9 @@ def initialize_orchestrator():
         logger.info("=" * 60)
         logger.info("INITIALIZING FLASK API ORCHESTRATOR")
         logger.info("=" * 60)
         # Import from app.py (this won't trigger app.py's launch code)
         # The orchestrator is already initialized in app.py's module-level code
@@ -51,13 +54,21 @@ def initialize_orchestrator():
         _orchestrator = orchestrator
         _process_message_async = process_message_async
         if _orchestrator is not None:
-            logger.info("✓ AI ORCHESTRATOR READY (shared with Gradio)")
         else:
-            logger.warning("⚠ Orchestrator not available - some features may be limited")
         _initialized = True
-        logger.info("=" * 60)
     except Exception as e:
         logger.error(f"Failed to initialize orchestrator: {e}", exc_info=True)

         logger.info("=" * 60)
         logger.info("INITIALIZING FLASK API ORCHESTRATOR")
         logger.info("=" * 60)
+        logger.info("[FLASK API] Loading orchestrator from app.py...")
+        logger.info("  → Orchestrator is shared with Gradio interface")
+        logger.info("  → No duplicate initialization needed")
         # Import from app.py (this won't trigger app.py's launch code)
         # The orchestrator is already initialized in app.py's module-level code
         _orchestrator = orchestrator
         _process_message_async = process_message_async
+        logger.info("[FLASK API] Verifying orchestrator status...")
         if _orchestrator is not None:
+            logger.info("  ✓ Orchestrator loaded successfully")
+            logger.info("  ✓ Request processing available")
+            logger.info("=" * 60)
+            logger.info("✅ AI ORCHESTRATOR READY (shared with Gradio)")
+            logger.info("=" * 60)
         else:
+            logger.warning("  ⚠ Orchestrator not available")
+            logger.warning("  ⚠ Some features may be limited")
+            logger.info("=" * 60)
+            logger.warning("⚠ FLASK API RUNNING IN DEGRADED MODE")
+            logger.info("=" * 60)
         _initialized = True
     except Exception as e:
         logger.error(f"Failed to initialize orchestrator: {e}", exc_info=True)

flask_api_standalone.py CHANGED Viewed

@@ -93,28 +93,50 @@ def initialize_orchestrator():
             logger.debug(f"Could not load ZeroGPU config: {e}")
         # Initialize LLM Router with local model loading enabled
-        logger.info("Initializing LLM Router with local GPU model loading...")
         llm_router = LLMRouter(hf_token, use_local_models=True, zero_gpu_config=zero_gpu_config)
-        logger.info("Initializing Agents...")
         agents = {
             'intent_recognition': create_intent_agent(llm_router),
             'response_synthesis': create_synthesis_agent(llm_router),
             'safety_check': create_safety_agent(llm_router),
             'skills_identification': create_skills_identification_agent(llm_router)
         }
-        logger.info("Initializing Context Manager...")
         context_manager = EfficientContextManager(llm_router=llm_router)
-        logger.info("Initializing Orchestrator...")
         orchestrator = MVPOrchestrator(llm_router, context_manager, agents)
         orchestrator_available = True
         logger.info("=" * 60)
-        logger.info("✓ AI ORCHESTRATOR READY")
-        logger.info("  - Local GPU models enabled")
-        logger.info("  - MAX_WORKERS: 4")
         logger.info("=" * 60)
         return True

             logger.debug(f"Could not load ZeroGPU config: {e}")
         # Initialize LLM Router with local model loading enabled
+        logger.info("[FLASK API STEP 1/5] Initializing LLM Router...")
+        logger.info("  → Configuring inference backend...")
+        if zero_gpu_config and zero_gpu_config.get("enabled"):
+            logger.info(f"  → ZeroGPU API: {zero_gpu_config.get('base_url', 'N/A')}")
+        else:
+            logger.info("  → ZeroGPU API: Disabled (using local/HF fallback)")
+        logger.info("  → Local models: Enabled (lazy loading)")
         llm_router = LLMRouter(hf_token, use_local_models=True, zero_gpu_config=zero_gpu_config)
+        logger.info("  ✓ LLM Router initialized")
+        logger.info("[FLASK API STEP 2/5] Initializing AI Agents...")
+        logger.info("  → Creating 4 specialized agents...")
         agents = {
             'intent_recognition': create_intent_agent(llm_router),
             'response_synthesis': create_synthesis_agent(llm_router),
             'safety_check': create_safety_agent(llm_router),
             'skills_identification': create_skills_identification_agent(llm_router)
         }
+        logger.info(f"  ✓ All {len(agents)} agents initialized")
+        logger.info("[FLASK API STEP 3/5] Initializing Context Manager...")
+        logger.info("  → Setting up session storage...")
         context_manager = EfficientContextManager(llm_router=llm_router)
+        logger.info("  ✓ Context Manager initialized")
+        logger.info("[FLASK API STEP 4/5] Initializing Orchestrator...")
+        logger.info("  → Connecting all components...")
         orchestrator = MVPOrchestrator(llm_router, context_manager, agents)
+        logger.info("  ✓ Orchestrator initialized")
+        logger.info("[FLASK API STEP 5/5] Verifying system readiness...")
         orchestrator_available = True
+        if llm_router and context_manager and orchestrator and agents:
+            logger.info("  ✓ All components verified")
+        else:
+            logger.warning("  ⚠ Some components may not be fully initialized")
+        logger.info("=" * 60)
+        logger.info("✅ AI ORCHESTRATOR READY (Flask API)")
         logger.info("=" * 60)
+        logger.info("Configuration:")
+        logger.info("  • Local GPU models: Enabled (lazy loading)")
+        logger.info("  • MAX_WORKERS: 4")
+        logger.info("  • ZeroGPU API: " + ("Enabled" if (zero_gpu_config and zero_gpu_config.get("enabled")) else "Disabled"))
         logger.info("=" * 60)
         return True

main.py CHANGED Viewed

@@ -169,51 +169,132 @@ def start_flask_background():
 def main():
     """Main entry point for HF Spaces"""
-    logger.info("🚀 Starting AI Research Assistant MVP")
-    logger.info("=" * 60)
-    # Check for HF Token
     hf_token = os.getenv('HF_TOKEN')
-    if not hf_token:
-        logger.warning("HF_TOKEN not found in environment. Some features may be limited.")
-    # Start Flask API in background (for external integrations)
     flask_thread = start_flask_background()
-    # Import the already-configured interface from app.py
-    # This imports the interface without triggering app.py's launch code
-    # (app.py's launch only runs when app.py is executed directly, not when imported)
-    logger.info("Creating interface from app.py (all handlers already initialized)...")
     demo, components = create_mobile_optimized_interface()
-    logger.info("✓ Interface created with all API endpoints and handlers")
-    # Detect if running on HF Spaces
-    # HF Spaces provides its own public URL, so share is not needed
     try:
         from spaces import GPU
         is_hf_spaces = True
-        logger.info("✓ Detected Hugging Face Spaces - using built-in public URL")
     except ImportError:
         is_hf_spaces = False
-        logger.info("✓ Local deployment - will create Gradio share link if needed")
     # Launch configuration
-    # Note: show_api=True is already set in app.py's interface creation,
-    # but we ensure it here as well for clarity
     launch_config = {
         'server_name': '0.0.0.0',
         'server_port': 7860,
         'share': not is_hf_spaces,  # Only create share link when not on HF Spaces
-        'show_api': True,  # Enable API endpoints (also set in app.py, but explicit here)
         'debug': False
     }
-    logger.info("=" * 60)
-    logger.info("✅ Application ready for launch")
     if flask_thread:
-        logger.info("✓ Flask API running in background")
-    logger.info("=" * 60)
     return demo.launch(**launch_config)
 if __name__ == "__main__":

 def main():
     """Main entry point for HF Spaces"""
+    logger.info("=" * 70)
+    logger.info("🚀 SYSTEM STARTUP - AI Research Assistant MVP")
+    logger.info("=" * 70)
+    # Step 1: Environment Configuration Check
+    logger.info("[STEP 1/7] Checking environment configuration...")
     hf_token = os.getenv('HF_TOKEN')
+    if hf_token:
+        logger.info("  ✓ HF_TOKEN configured")
+    else:
+        logger.warning("  ⚠ HF_TOKEN not found - some features may be limited")
+    # Check ZeroGPU configuration
+    use_zero_gpu = os.getenv('USE_ZERO_GPU', 'false').lower() == 'true'
+    if use_zero_gpu:
+        zero_gpu_url = os.getenv('ZERO_GPU_API_URL', '')
+        if zero_gpu_url:
+            logger.info(f"  ✓ ZeroGPU API enabled: {zero_gpu_url}")
+        else:
+            logger.warning("  ⚠ ZeroGPU enabled but URL not configured")
+    else:
+        logger.info("  ✓ ZeroGPU API disabled (using local/HF fallback)")
+    logger.info("  ✓ Environment check complete")
+    # Step 2: Initialize Orchestration System (via app.py import)
+    logger.info("[STEP 2/7] Initializing orchestration system...")
+    logger.info("  → This step initializes: LLM Router, Agents, Context Manager, Orchestrator")
+    logger.info("  → Detailed logs available in orchestration initialization section")
+    # Step 3: Start Flask API in background
+    logger.info("[STEP 3/7] Starting Flask API server...")
     flask_thread = start_flask_background()
+    if flask_thread:
+        logger.info("  ✓ Flask API started successfully")
+    else:
+        logger.warning("  ⚠ Flask API not started (continuing with Gradio only)")
+    # Step 4: Create Gradio Interface
+    logger.info("[STEP 4/7] Creating Gradio interface...")
+    logger.info("  → Loading UI components and API endpoints...")
     demo, components = create_mobile_optimized_interface()
+    logger.info("  ✓ Gradio interface created")
+    logger.info("  ✓ API endpoints registered")
+    # Step 5: Verify Component Status
+    logger.info("[STEP 5/7] Verifying component status...")
+    if components and not components.get('mock_mode'):
+        logger.info("  ✓ All components initialized successfully")
+        if 'orchestrator' in components and components['orchestrator']:
+            logger.info("  ✓ Orchestrator available")
+        else:
+            logger.warning("  ⚠ Orchestrator not available (degraded mode)")
+    else:
+        logger.warning("  ⚠ Running in mock/fallback mode")
+    logger.info("  ✓ Component verification complete")
+    # Step 6: Detect Deployment Environment
+    logger.info("[STEP 6/7] Detecting deployment environment...")
     try:
         from spaces import GPU
         is_hf_spaces = True
+        logger.info("  ✓ Detected Hugging Face Spaces")
+        logger.info("  ✓ Using built-in public URL (no share link needed)")
     except ImportError:
         is_hf_spaces = False
+        logger.info("  ✓ Detected local deployment")
+        logger.info("  → Will create Gradio share link if needed")
+    logger.info("  ✓ Environment detection complete")
+    # Step 7: Final System Readiness Check
+    logger.info("[STEP 7/7] Performing final system readiness check...")
+    readiness_checks = []
+    # Check Gradio interface
+    if demo:
+        readiness_checks.append(("Gradio Interface", True))
+        logger.info("  ✓ Gradio interface ready")
+    else:
+        readiness_checks.append(("Gradio Interface", False))
+        logger.error("  ✗ Gradio interface not ready")
+    # Check Flask API
+    if flask_thread and flask_thread.is_alive():
+        readiness_checks.append(("Flask API", True))
+        logger.info("  ✓ Flask API running")
+    else:
+        readiness_checks.append(("Flask API", False))
+        logger.warning("  ⚠ Flask API not running (optional)")
+    # Check Orchestrator
+    if components and components.get('orchestrator'):
+        readiness_checks.append(("Orchestrator", True))
+        logger.info("  ✓ Orchestrator available")
+    else:
+        readiness_checks.append(("Orchestrator", False))
+        logger.warning("  ⚠ Orchestrator not available (degraded mode)")
     # Launch configuration
     launch_config = {
         'server_name': '0.0.0.0',
         'server_port': 7860,
         'share': not is_hf_spaces,  # Only create share link when not on HF Spaces
+        'show_api': True,  # Enable API endpoints
         'debug': False
     }
+    # Final System Ready Message
+    logger.info("=" * 70)
+    logger.info("✅ SYSTEM READY - All components initialized")
+    logger.info("=" * 70)
+    logger.info("Component Status:")
+    for component, status in readiness_checks:
+        status_icon = "✓" if status else "⚠"
+        logger.info(f"  {status_icon} {component}: {'Ready' if status else 'Not Available'}")
+    logger.info("")
+    logger.info("Service Endpoints:")
+    logger.info("  • Gradio UI: http://0.0.0.0:7860")
+    logger.info("  • Gradio API: http://0.0.0.0:7860/api/")
     if flask_thread:
+        logger.info("  • Flask API: http://0.0.0.0:5001/api/chat")
+        logger.info("  • Flask Health: http://0.0.0.0:5001/health")
+    logger.info("")
+    logger.info("🚀 Launching application...")
+    logger.info("=" * 70)
     return demo.launch(**launch_config)
 if __name__ == "__main__":