Files
connectai/tests/lmStudioStreamer.test.ts
T
g1nation 36db170844 feat: v2.2.64 — LM Studio 모델 발견/에러 표시 + macOS 셸 호환성
- LM Studio 모델 dropdown을 SDK system.listDownloadedModels('llm') 으로
  조회하도록 변경. REST /v1/models 는 JIT 옵션이 꺼져 있으면 로드된 모델만
  반환하여 macOS 환경에서 dropdown 이 비거나 fallback 한 줄만 남던 문제 해결.
  SDK 실패 시 REST 로 자동 fallback.
- LM Studio 로드/언로드 실패를 readyBar 의 영속 segment 로 표시. 모델을
  다시 선택하면 clearLmStudioError() 로 해제.
- src/security.ts: PowerShell '&&' rewrite 를 win32 에서만 수행. macOS/Linux
  에서는 'if (\$?) { ... }' 가 zsh/bash 문법 오류라 명령 자체가 깨졌음.
- src/utils.ts: system prompt 에 OS 별 [ENVIRONMENT] 블록 동적 주입
  (셸/경로 스타일/체이닝 연산자). 'cd E:\\... ; ...' 같은 Windows 전용
  예시를 macOS 에서 그대로 따라하던 회귀 차단.
- 테스트 mock 에 listDownloaded() 추가.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-23 09:37:29 +09:00

222 lines
8.5 KiB
TypeScript

/**
* Unit tests for LMStudioStreamer.
*
* Strategy: inject a fake ILMStudioClient that returns a fake model handle whose
* `respond()` yields a controllable async iterable. No real SDK or WebSocket touched.
*/
import { LMStudioStreamer } from '../src/lmstudio/streamer';
import type { ChatStreamEvent } from '../src/lmstudio/streamer';
import type { ILMStudioClient } from '../src/lmstudio/client';
class FakeModel {
public lastChat: any = null;
public lastOpts: any = null;
public cancelCount = 0;
public failNext: Error | null = null;
public chunks: string[] = [];
constructor(opts: { chunks?: string[]; failAfter?: number; throwOnRespond?: Error; stopReason?: string } = {}) {
this.chunks = opts.chunks ?? ['Hel', 'lo, ', 'world'];
this._failAfter = opts.failAfter;
this._throwOnRespond = opts.throwOnRespond;
this.stopReason = opts.stopReason;
}
private _failAfter?: number;
private _throwOnRespond?: Error;
public stopReason: string | undefined;
respond(chat: any, opts: any) {
if (this._throwOnRespond) {
throw this._throwOnRespond;
}
this.lastChat = chat;
this.lastOpts = opts;
const chunks = this.chunks;
const failAfter = this._failAfter;
const stopReason = this.stopReason;
let i = 0;
const self = this;
// Real OngoingPrediction is both async-iterable AND a thenable resolving to a
// PredictionResult with `.stats.stopReason`. Mirror that shape so the streamer
// can read the stop reason after the stream drains.
const prediction: any = {
cancel: async () => { self.cancelCount++; },
then(resolve: (v: any) => void) { resolve({ stats: { stopReason } }); },
[Symbol.asyncIterator]() {
return {
async next() {
if (opts?.signal?.aborted) {
return { value: undefined, done: true };
}
if (failAfter !== undefined && i >= failAfter) {
throw new Error('mid-stream failure');
}
if (i >= chunks.length) {
return { value: undefined, done: true };
}
const fragment = { content: chunks[i++] };
return { value: fragment, done: false };
},
};
},
};
return prediction;
}
}
class FakeClient implements ILMStudioClient {
public model: FakeModel;
public getModelHandleCalls: string[] = [];
constructor(model: FakeModel = new FakeModel()) {
this.model = model;
}
setBaseUrl(_: string): void { /* noop */ }
async load(_: string): Promise<void> { /* noop */ }
async unload(_: string): Promise<void> { /* noop */ }
async listLoaded(): Promise<string[]> { return []; }
async listLoadedCached(): Promise<string[]> { return []; }
async listDownloaded(): Promise<string[]> { return []; }
async isReachable(): Promise<boolean> { return true; }
async getModelHandle(modelKey: string): Promise<any> {
this.getModelHandleCalls.push(modelKey);
return this.model;
}
}
// The streamer emits a trailing { token: '', stopReason } event on normal completion;
// `collect` returns just the non-empty content tokens (what every real consumer uses).
async function collect(stream: AsyncIterable<ChatStreamEvent>): Promise<string[]> {
const out: string[] = [];
for await (const { token } of stream) {
if (token) out.push(token);
}
return out;
}
async function collectEvents(stream: AsyncIterable<ChatStreamEvent>): Promise<ChatStreamEvent[]> {
const out: ChatStreamEvent[] = [];
for await (const ev of stream) out.push(ev);
return out;
}
describe('LMStudioStreamer', () => {
test('streams tokens from the SDK respond iterator', async () => {
const client = new FakeClient(new FakeModel({ chunks: ['Hel', 'lo'] }));
const streamer = new LMStudioStreamer(client);
const tokens = await collect(streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.4,
}));
expect(tokens).toEqual(['Hel', 'lo']);
expect(client.getModelHandleCalls).toEqual(['m1']);
expect(client.model.lastOpts.temperature).toBe(0.4);
});
test('emits a trailing stopReason event from prediction stats', async () => {
const client = new FakeClient(new FakeModel({ chunks: ['hi'], stopReason: 'maxPredictedTokensReached' }));
const streamer = new LMStudioStreamer(client);
const events = await collectEvents(streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.1,
maxTokens: 64,
}));
expect(events.map(e => e.token)).toEqual(['hi', '']);
expect(events[events.length - 1].stopReason).toBe('maxPredictedTokensReached');
// maxTokens / contextOverflowPolicy are forwarded to the SDK
expect(client.model.lastOpts.maxTokens).toBe(64);
expect(client.model.lastOpts.contextOverflowPolicy).toBe('stopAtLimit');
});
test('passes signal through to the SDK', async () => {
const client = new FakeClient();
const streamer = new LMStudioStreamer(client);
const ac = new AbortController();
await collect(streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.2,
signal: ac.signal,
}));
expect(client.model.lastOpts.signal).toBe(ac.signal);
});
test('aborting mid-stream stops cleanly without throwing', async () => {
const client = new FakeClient(new FakeModel({ chunks: ['a', 'b', 'c', 'd'] }));
const streamer = new LMStudioStreamer(client);
const ac = new AbortController();
const out: string[] = [];
const iter = streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.3,
signal: ac.signal,
});
for await (const { token } of iter) {
out.push(token);
if (out.length === 2) ac.abort();
}
expect(out.length).toBeGreaterThanOrEqual(2);
expect(out.length).toBeLessThanOrEqual(3);
});
test('rejects when modelName is empty', async () => {
const client = new FakeClient();
const streamer = new LMStudioStreamer(client);
await expect(collect(streamer.stream({
modelName: '',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.2,
}))).rejects.toThrow(/without a model name/i);
});
test('mid-stream SDK failure is re-thrown when signal not aborted', async () => {
const client = new FakeClient(new FakeModel({ chunks: ['a', 'b'], failAfter: 1 }));
const streamer = new LMStudioStreamer(client);
await expect(collect(streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.2,
}))).rejects.toThrow(/mid-stream failure/);
});
test('mid-stream SDK failure swallowed if signal already aborted', async () => {
const client = new FakeClient(new FakeModel({ chunks: ['a', 'b'], failAfter: 1 }));
const streamer = new LMStudioStreamer(client);
const ac = new AbortController();
const iter = streamer.stream({
modelName: 'm1',
messages: [{ role: 'user', content: 'hi' }],
temperature: 0.2,
signal: ac.signal,
});
const out: string[] = [];
try {
for await (const { token } of iter) {
out.push(token);
ac.abort(); // abort right after first token, before failure point
}
} catch (e) {
// expected to be swallowed
}
expect(out).toEqual(['a']);
});
test('passes messages through to model.respond', async () => {
const client = new FakeClient();
const streamer = new LMStudioStreamer(client);
const messages = [
{ role: 'system' as const, content: 'sys' },
{ role: 'user' as const, content: 'hi' },
];
await collect(streamer.stream({ modelName: 'm1', messages, temperature: 0.5 }));
expect(client.model.lastChat).toEqual(messages);
});
});