feat: add clear error message when llama-server not running

2026-02-05 13:17:56 -08:00
parent e8079347c7
commit 8e7fa24fd6
2 changed files with 28 additions and 8 deletions
@@ -48,14 +48,22 @@ export class LlamaCppClient implements ModelClient {
      headers['Authorization'] = `Bearer ${this.authToken}`;
    }

-    const response = await fetch(`${this.endpoint}/v1/chat/completions`, {
-      method: 'POST',
-      headers,
-      body: JSON.stringify({
-        messages,
-        max_tokens: request.maxTokens ?? 2048,
-      }),
-    });
+    let response: Response;
+    try {
+      response = await fetch(`${this.endpoint}/v1/chat/completions`, {
+        method: 'POST',
+        headers,
+        body: JSON.stringify({
+          messages,
+          max_tokens: request.maxTokens ?? 2048,
+        }),
+      });
+    } catch (error) {
+      if (error instanceof TypeError && error.message.includes('fetch failed')) {
+        throw new Error(`llama-server not running at ${this.endpoint}`);
+      }
+      throw error;
+    }

    if (!response.ok) {
      const text = await response.text();