fix: warm up ACP subprocess eagerly to avoid 30s cold start on status

The pool refactor made ACP client creation lazy, causing the first /llm/health call to spawn + initialize + prompt Gemini in one request (30s+). Now warmup() eagerly starts the subprocess on mcplocal boot. Also fetches models in parallel with the LLM health check.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-25 01:37:30 +00:00
parent e8ac500ae9
commit 9bd3127519
3 changed files with 26 additions and 11 deletions
--- a/src/cli/src/commands/status.ts
+++ b/src/cli/src/commands/status.ts
@@ -47,7 +47,7 @@ function defaultCheckHealth(url: string): Promise<boolean> {
 */
 function defaultCheckLlm(mcplocalUrl: string): Promise<string> {
  return new Promise((resolve) => {
-    const req = http.get(`${mcplocalUrl}/llm/health`, { timeout: 30000 }, (res) => {
+    const req = http.get(`${mcplocalUrl}/llm/health`, { timeout: 45000 }, (res) => {
      const chunks: Buffer[] = [];
      res.on('data', (chunk: Buffer) => chunks.push(chunk));
      res.on('end', () => {
@@ -167,8 +167,9 @@ export function createStatusCommand(deps?: Partial<StatusCommandDeps>): Command
        return;
      }

-      // LLM check with spinner — queries mcplocal's /llm/health endpoint
+      // LLM check + models fetch in parallel — queries mcplocal endpoints
      const llmPromise = checkLlm(config.mcplocalUrl);
+      const modelsPromise = fetchModels(config.mcplocalUrl);

      if (isTTY) {
        let frame = 0;
@@ -177,7 +178,7 @@ export function createStatusCommand(deps?: Partial<StatusCommandDeps>): Command
          frame++;
        }, 80);

-        const llmStatus = await llmPromise;
+        const [llmStatus, models] = await Promise.all([llmPromise, modelsPromise]);
        clearInterval(interval);

        if (llmStatus === 'ok' || llmStatus === 'ok (key stored)') {
@@ -185,20 +186,20 @@ export function createStatusCommand(deps?: Partial<StatusCommandDeps>): Command
        } else {
          write(`${CLEAR_LINE}LLM:        ${llmLabel} ${RED}✗ ${llmStatus}${RESET}\n`);
        }
+        if (models.length > 0) {
+          log(`${DIM}            Available: ${models.join(', ')}${RESET}`);
+        }
      } else {
        // Non-TTY: no spinner, just wait and print
-        const llmStatus = await llmPromise;
+        const [llmStatus, models] = await Promise.all([llmPromise, modelsPromise]);
        if (llmStatus === 'ok' || llmStatus === 'ok (key stored)') {
          log(`LLM:        ${llmLabel} ✓ ${llmStatus}`);
        } else {
          log(`LLM:        ${llmLabel} ✗ ${llmStatus}`);
        }
-      }
-
-      // Show available models (non-blocking, best effort)
-      const models = await fetchModels(config.mcplocalUrl);
-      if (models.length > 0) {
-        log(`${DIM}            Available: ${models.join(', ')}${RESET}`);
+        if (models.length > 0) {
+          log(`${DIM}            Available: ${models.join(', ')}${RESET}`);
+        }
      }
    });
 }