feat(models): add streaming and tier switching to ModelRouter

This commit is contained in:
William Valentin
2026-02-05 10:48:41 -08:00
parent 896a0da10e
commit 9a48c39b07
2 changed files with 122 additions and 3 deletions
+64 -1
View File
@@ -1,6 +1,6 @@
import { describe, it, expect, vi, beforeEach } from 'vitest';
import { ModelRouter } from './router.js';
import type { ModelClient, ChatResponse } from './types.js';
import type { ModelClient, ChatResponse, ChatStreamEvent } from './types.js';
describe('ModelRouter', () => {
const createMockClient = (name: string, shouldFail = false): ModelClient => ({
@@ -78,3 +78,66 @@ describe('ModelRouter', () => {
expect(defaultClient.chat).not.toHaveBeenCalled();
});
});
describe('ModelRouter streaming', () => {
  /** Wraps a pre-built stream in a mock client whose `chatStream` returns it. */
  const clientFor = (stream: AsyncIterable<ChatStreamEvent>) => ({
    chat: vi.fn(),
    chatStream: vi.fn().mockReturnValue(stream),
  });

  /** Drains the router's stream and collects the text of non-empty content events. */
  const collectContent = async (router: ModelRouter): Promise<string[]> => {
    const received: string[] = [];
    for await (const event of router.chatStream({ messages: [] })) {
      if (event.type === 'content' && event.content) {
        received.push(event.content);
      }
    }
    return received;
  };

  it('streams from primary client', async () => {
    async function* greeting(): AsyncIterable<ChatStreamEvent> {
      yield { type: 'content', content: 'Hello' };
      yield { type: 'done', usage: { inputTokens: 5, outputTokens: 3 } };
    }

    const router = new ModelRouter({
      default: clientFor(greeting()),
      fallbackChain: [],
    });

    expect(await collectContent(router)).toEqual(['Hello']);
  });

  it('falls back when primary stream fails', async () => {
    // The primary reports failure in-band, as an `error` event.
    async function* broken(): AsyncIterable<ChatStreamEvent> {
      yield { type: 'error', error: new Error('Primary failed') };
    }
    async function* recovered(): AsyncIterable<ChatStreamEvent> {
      yield { type: 'content', content: 'Fallback' };
      yield { type: 'done', usage: { inputTokens: 5, outputTokens: 3 } };
    }

    const router = new ModelRouter({
      default: clientFor(broken()),
      fallbackChain: [clientFor(recovered())],
    });

    // Only the fallback's content should reach the consumer.
    expect(await collectContent(router)).toEqual(['Fallback']);
  });
});
+58 -2
View File
@@ -1,4 +1,4 @@
import type { ChatRequest, ChatResponse, ModelClient } from './types.js';
import type { ChatRequest, ChatResponse, ChatStreamEvent, ModelClient } from './types.js';
/** Tier names under which the router can hold a registered client. */
export type ModelTier = 'fast' | 'default' | 'complex' | 'local';
@@ -14,6 +14,7 @@ export class ModelRouter implements ModelClient {
/** Clients keyed by tier; a lookup that misses falls back to `defaultClient`. */
private clients: Map<ModelTier, ModelClient>;
/** Client used when no client is registered for the requested tier. */
private defaultClient: ModelClient;
/** Clients tried in order after the primary client fails. */
private fallbackChain: ModelClient[];
/** Tier used by `chat`/`chatStream` when the caller does not pass one. */
private currentTier: ModelTier = 'default';
constructor(config: ModelRouterConfig) {
this.clients = new Map();
@@ -26,8 +27,25 @@ export class ModelRouter implements ModelClient {
if (config.local) this.clients.set('local', config.local);
}
/**
 * Selects the tier used by calls that do not pass an explicit tier.
 *
 * @param tier - Tier to switch to.
 * @returns `true` when a client is registered for `tier` and the switch was
 *   made; `false` when no such client exists, leaving the current tier as is.
 */
setTier(tier: ModelTier): boolean {
  const isRegistered = this.clients.has(tier);
  if (!isRegistered) {
    return false;
  }

  this.currentTier = tier;
  return true;
}
/**
 * Reports the tier currently used when a call does not specify one.
 *
 * @returns The stored current tier.
 */
getTier(): ModelTier {
return this.currentTier;
}
/**
 * Lists the tiers that have a client registered.
 *
 * @returns A new array of the registered tier names, in the map's iteration order.
 */
getAvailableTiers(): ModelTier[] {
  return [...this.clients.keys()];
}
async chat(request: ChatRequest, tier?: ModelTier): Promise<ChatResponse> {
const primaryClient = tier ? this.clients.get(tier) ?? this.defaultClient : this.defaultClient;
const useTier = tier ?? this.currentTier;
const primaryClient = this.clients.get(useTier) ?? this.defaultClient;
const errors: Error[] = [];
// Try primary client
@@ -52,6 +70,44 @@ export class ModelRouter implements ModelClient {
throw new Error(`All model providers failed: ${errors.map(e => e.message).join(', ')}`);
}
/**
 * Streams a chat response, falling back through `fallbackChain` when a
 * provider fails.
 *
 * The primary client is the one registered for `tier` (or the current tier
 * when `tier` is omitted), defaulting to `defaultClient` when none is
 * registered. Clients without a `chatStream` method are skipped.
 *
 * A provider counts as failed when it emits an `error` event OR when its
 * stream throws; both cases move on to the next provider instead of
 * surfacing the failure to the consumer.
 *
 * Note: events already yielded before a provider fails are not retracted, so
 * a consumer may see partial content from a failed provider followed by the
 * full output of a fallback.
 *
 * @param request - Chat request forwarded unchanged to each provider tried.
 * @param tier - Optional tier override for selecting the primary client.
 * @returns Events from the first provider that completes without failure, or
 *   a single trailing `error` event when every provider failed or none
 *   supports streaming.
 */
async *chatStream(request: ChatRequest, tier?: ModelTier): AsyncIterable<ChatStreamEvent> {
  const useTier = tier ?? this.currentTier;
  const primaryClient = this.clients.get(useTier) ?? this.defaultClient;

  // Primary first, then the fallback chain in order; the label only affects logging.
  const candidates: Array<{ label: string; client: ModelClient }> = [
    { label: 'Primary', client: primaryClient },
    ...this.fallbackChain.map((client) => ({ label: 'Fallback', client })),
  ];

  for (const { label, client } of candidates) {
    if (!client.chatStream) continue;

    let failed = false;
    try {
      for await (const event of client.chatStream(request)) {
        if (event.type === 'error') {
          // In-band failure: swallow the event and move on to the next provider.
          failed = true;
          console.warn(`${label} stream failed: ${event.error?.message}`);
          break;
        }
        yield event;
      }
    } catch (err: unknown) {
      // A thrown/rejected stream is treated the same as an in-band error event,
      // so the fallback chain still gets its chance.
      failed = true;
      const reason = err instanceof Error ? err.message : String(err);
      console.warn(`${label} stream failed: ${reason}`);
    }

    if (!failed) return;
  }

  yield { type: 'error', error: new Error('All streaming providers failed') };
}
/**
 * Looks up the client registered for a tier, without any default fallback.
 *
 * @param tier - Tier to look up.
 * @returns The registered client, or `undefined` when none is registered.
 */
getClient(tier: ModelTier): ModelClient | undefined {
return this.clients.get(tier);
}