From 4118612034171a3b5a9a828e97d13c3a612f6e57 Mon Sep 17 00:00:00 2001
From: Trey <tgrunnagle@gmail.com>
Date: Thu, 6 Nov 2025 07:48:15 -0800
Subject: [PATCH] Start server before workload and registry ingestion

Speed up server startup by moving ingestion to background

- Removed blocking registry and workload ingestion from server startup in `cli.py`
- Server now starts immediately after configuration validation and database migration
- Ingestion now happens asynchronously in the polling manager background thread
- Eliminated artificial startup delay in `polling_manager.py` that was waiting for minimum polling interval
- Background thread starts polling after 3-second grace period instead of waiting for initial ingestion to complete
- Server is ready to accept connections in seconds instead of minutes
- Ingestion failures no longer prevent server startup - polling will retry automatically

This change transforms the startup from synchronous blocking model to asynchronous background processing, dramatically reducing time-to-ready while maintaining the same functionality through the existing polling mechanism.
---
 src/mcp_optimizer/cli.py             | 53 +---------------------------
 src/mcp_optimizer/polling_manager.py |  4 ---
 2 files changed, 1 insertion(+), 56 deletions(-)

diff --git a/src/mcp_optimizer/cli.py b/src/mcp_optimizer/cli.py
index ea76bce..314fffb 100644
--- a/src/mcp_optimizer/cli.py
+++ b/src/mcp_optimizer/cli.py
@@ -1,4 +1,3 @@
-import asyncio
 import os
 import signal
 from pathlib import Path
@@ -10,9 +9,7 @@
 
 from mcp_optimizer.config import ConfigurationError, MCPOptimizerConfig, get_config
 from mcp_optimizer.configure_logging import configure_logging
-from mcp_optimizer.db.config import DatabaseConfig, run_migrations
-from mcp_optimizer.embeddings import EmbeddingManager
-from mcp_optimizer.ingestion import IngestionService
+from mcp_optimizer.db.config import run_migrations
 from mcp_optimizer.polling_manager import configure_polling, shutdown_polling
 from mcp_optimizer.server import initialize_server_components
 from mcp_optimizer.toolhive.toolhive_client import ToolhiveClient
@@ -218,54 +215,6 @@ def main(**kwargs: Any) -> None:
     initialize_server_components(config)
 
     try:
-        # Pass config values to components instead of using get_config()
-        db_config = DatabaseConfig(database_url=config.async_db_url)
-        embedding_manager = EmbeddingManager(
-            model_name=config.embedding_model_name,
-            enable_cache=config.enable_embedding_cache,
-            threads=config.embedding_threads,
-            fastembed_cache_path=config.fastembed_cache_path,
-        )
-        ingestion_service = IngestionService(
-            db_config,
-            embedding_manager,
-            mcp_timeout=config.mcp_timeout,
-            registry_ingestion_batch_size=config.registry_ingestion_batch_size,
-            workload_ingestion_batch_size=config.workload_ingestion_batch_size,
-            encoding=config.encoding,
-            skipped_workloads=config.skipped_workloads,
-            runtime_mode=config.runtime_mode,
-            k8s_api_server_url=config.k8s_api_server_url,
-            k8s_namespace=config.k8s_namespace,
-            k8s_all_namespaces=config.k8s_all_namespaces,
-        )
-
-        async def run_ingestion():
-            """Run ingestion tasks in a single event loop."""
-            await ingestion_service.ingest_registry(toolhive_client=toolhive_client)
-            await ingestion_service.ingest_workloads(toolhive_client=toolhive_client)
-            # Dispose the database engine to prevent event loop conflicts
-            # The server will create a new engine in its own event loop
-            await db_config.close()
-
-        logger.info("Starting initial ingestion process")
-        try:
-            asyncio.run(run_ingestion())
-            logger.info("Initial ingestion process completed")
-        except Exception as e:
-            # Import here to avoid circular dependency
-            from mcp_optimizer.toolhive.toolhive_client import ToolhiveConnectionError
-
-            if isinstance(e, ToolhiveConnectionError):
-                logger.critical(
-                    "Unable to connect to ToolHive after exhausting all retries. "
-                    "Please ensure ToolHive is running and accessible.",
-                    error=str(e),
-                )
-                raise click.ClickException(f"Failed to connect to ToolHive: {e}. Exiting.") from e
-            # Re-raise other exceptions
-            raise
-
         # Configure polling manager for the server
         logger.info(
             "Configuring polling manager",
diff --git a/src/mcp_optimizer/polling_manager.py b/src/mcp_optimizer/polling_manager.py
index 05c5fdd..bd19905 100644
--- a/src/mcp_optimizer/polling_manager.py
+++ b/src/mcp_optimizer/polling_manager.py
@@ -301,10 +301,6 @@ async def start_polling(self) -> None:
         # Store the event loop for later use by targeted polling
         self._loop = asyncio.get_running_loop()
 
-        startup_time_sec = min(self.workload_polling_interval, self.registry_polling_interval)
-        logger.info("Delaying polling start to allow server startup", seconds=startup_time_sec)
-        await asyncio.sleep(startup_time_sec)
-
         logger.info(
             "Creating polling tasks",
             workload_interval_seconds=self.workload_polling_interval,