feat: add clear error message when llama-server is not running

This commit is contained in:
William Valentin
2026-02-05 13:17:56 -08:00
parent e8079347c7
commit 8e7fa24fd6
2 changed files with 28 additions and 8 deletions
+16 -8
View File
@@ -48,14 +48,22 @@ export class LlamaCppClient implements ModelClient {
headers['Authorization'] = `Bearer ${this.authToken}`;
}
const response = await fetch(`${this.endpoint}/v1/chat/completions`, {
method: 'POST',
headers,
body: JSON.stringify({
messages,
max_tokens: request.maxTokens ?? 2048,
}),
});
let response: Response;
try {
response = await fetch(`${this.endpoint}/v1/chat/completions`, {
method: 'POST',
headers,
body: JSON.stringify({
messages,
max_tokens: request.maxTokens ?? 2048,
}),
});
} catch (error) {
if (error instanceof TypeError && error.message.includes('fetch failed')) {
throw new Error(`llama-server not running at ${this.endpoint}`);
}
throw error;
}
if (!response.ok) {
const text = await response.text();