fix: add model parameter to LlamaCppClient requests

This commit is contained in:
William Valentin
2026-02-05 15:51:33 -08:00
parent 2fc07b4bca
commit d2a597d49d
2 changed files with 8 additions and 0 deletions
+3
View File
@@ -24,6 +24,7 @@ describe('LlamaCppClient', () => {
const client = new LlamaCppClient({
endpoint: 'http://localhost:8080',
model: 'test-model',
});
const response = await client.chat({
@@ -64,6 +65,7 @@ describe('LlamaCppClient', () => {
const client = new LlamaCppClient({
endpoint: 'http://localhost:8080',
model: 'test-model',
});
const events: ChatStreamEvent[] = [];
@@ -87,6 +89,7 @@ describe('LlamaCppClient', () => {
const client = new LlamaCppClient({
endpoint: 'http://localhost:8080',
model: 'test-model',
});
await expect(client.chat({
+5
View File
@@ -2,6 +2,7 @@ import type { ChatRequest, ChatResponse, ChatStreamEvent, ModelClient } from '..
/**
 * Construction options for {@link LlamaCppClient}.
 */
export interface LlamaCppClientConfig {
/** Base URL of the server, e.g. `http://localhost:8080`. The client drops one trailing `/` when storing it. */
endpoint: string;
/** Model identifier; the client places it in the `model` field of the JSON request bodies it sends. */
model: string;
/** Optional token. NOTE(review): presumably used to authenticate requests — confirm where the headers are built. */
authToken?: string;
}
@@ -22,10 +23,12 @@ interface LlamaCppStreamChunk {
export class LlamaCppClient implements ModelClient {
private endpoint: string;
private model: string;
private authToken?: string;
/**
 * Captures the connection settings from `config` on the instance.
 *
 * @param config - Endpoint, model identifier, and optional auth token.
 */
constructor(config: LlamaCppClientConfig) {
  const { endpoint, model, authToken } = config;
  // Remove a single trailing slash from the endpoint; everything else is stored untouched.
  const normalizedEndpoint = endpoint.replace(/\/$/, '');
  this.endpoint = normalizedEndpoint;
  this.model = model;
  this.authToken = authToken;
}
@@ -54,6 +57,7 @@ export class LlamaCppClient implements ModelClient {
method: 'POST',
headers,
body: JSON.stringify({
model: this.model,
messages,
max_tokens: request.maxTokens ?? 2048,
}),
@@ -106,6 +110,7 @@ export class LlamaCppClient implements ModelClient {
method: 'POST',
headers,
body: JSON.stringify({
model: this.model,
messages,
max_tokens: request.maxTokens ?? 2048,
stream: true,