feat: ConnectAI structural hardening and retrieval precision improvements

This commit is contained in:
g1nation
2026-05-05 21:37:45 +09:00
parent c2f17cfb03
commit 466e9e4d5f
17 changed files with 424 additions and 160 deletions
+10 -2
View File
@@ -77,10 +77,18 @@ describe('Scoring Engine Unit Tests (v2.72.0)', () => {
// Language boundary split should handle alternating chars
expect(tokens).toContain('astra');
expect(tokens).toContain('v2');
expect(tokens).toContain('v2.0'); // [Structural Fix] 점(.)이 포함된 버전 번호 보존 확인
expect(tokens).toContain('한');
expect(tokens).toContain('글');
// Symbols should be filtered out
// [New Feature] Verify that technical symbols are preserved (C++, C#, .net)
const techText = 'I love C++ and C# programming on .net platform.';
const techTokens = tokenize(techText);
expect(techTokens).toContain('c++');
expect(techTokens).toContain('c#');
expect(techTokens).toContain('.net');
// Symbols should be filtered out (except the preserved ones)
expect(tokens.some(t => /^[!@#$]+$/.test(t))).toBe(false);
});