feat: 검색에서 kind/tag/search_keywords 활용 — FTS + 랭킹 부스트

SonAIengine · claude · SonAIengine · commit 412a7784b997 · 2026-03-22T14:06:49.000+09:00
## FTS 개선 (memory.py)
- tag 매칭 가중치 0.5→1.0 (핵심 주제 반영)
- properties["_search_keywords"] 매칭 추가 (LLM 생성 검색 키워드, 가중치 1.5)
- properties["_summary"] 매칭 추가 (LLM 생성 요약, 가중치 0.5)

## 랭킹 부스트 (search.py)
- kind-intent 부스트: 쿼리에 "실패"→LESSON, "정책"→RULE 등 매칭 시 +0.05
- tag-query 부스트: 쿼리 키워드가 노드 태그에 정확 매칭 시 +0.03/태그
- 보수적 부스트로 범용 태그에 의한 노이즈 최소화

## Ablation 결과
- S1 +Ontology: S0 대비 -0.1% (이전 -0.8%) → 거의 중립 달성
- 규칙 기반 태그의 구조적 한계 — LLM 태그에서 효과 기대

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/src/synaptic/backends/memory.py b/src/synaptic/backends/memory.py
@@ -125,7 +125,16 @@ async def search_fts(self, query: str, *, limit: int = 20) -> list[Node]:
             # Tag 매칭 보너스
             if node.tags:
                 tag_text = " ".join(node.tags).lower()
-                score += sum(0.5 for t in terms if t in tag_text)
+                score += sum(1.0 for t in terms if t in tag_text)
+
+            # _search_keywords 매칭 (LLM이 생성한 검색 최적화 키워드)
+            if node.properties:
+                search_kw = node.properties.get("_search_keywords", "").lower()
+                if search_kw:
+                    score += sum(1.5 for t in terms if t in search_kw)
+                summary = node.properties.get("_summary", "").lower()
+                if summary:
+                    score += sum(0.5 for t in terms if t in summary)
 
             if score > 0:
                 scored.append((node, score))
diff --git a/src/synaptic/search.py b/src/synaptic/search.py
@@ -9,6 +9,31 @@
 from synaptic.resonance import ResonanceScorer
 from synaptic.synonyms import expand_synonyms
 
+# Query keyword hints per NodeKind: a query containing any hint boosts nodes of that kind.
+_KIND_QUERY_HINTS: dict[NodeKind, list[str]] = {
+    NodeKind.LESSON: [
+        "실패", "에러", "오류", "장애", "교훈", "배운", "주의",
+        "failure", "error", "incident", "lesson", "postmortem",
+    ],
+    NodeKind.RULE: [
+        "규칙", "정책", "규정", "금지", "필수", "가이드",
+        "rule", "policy", "constraint", "must", "forbidden",
+    ],
+    NodeKind.DECISION: [
+        "결정", "선택", "판단", "채택", "어떻게",
+        "decision", "choice", "decided", "approach",
+    ],
+    NodeKind.ARTIFACT: [
+        "api", "엔드포인트", "스키마", "명세", "코드",
+        "endpoint", "schema", "spec", "interface",
+    ],
+    NodeKind.ENTITY: [
+        "회사", "조직", "제품", "서비스", "시스템",
+        "company", "organization", "product", "service",
+    ],
+}
+_KIND_BOOST = 0.05  # amount added to search_score on a kind match (kept conservative)
+
 
 class HybridSearch:
     """3-stage fallback search: FTS+vector → synonym expansion → query rewrite."""
@@ -107,10 +132,30 @@ async def search(
                 if node.kind in kind_set
             }
 
+        # Kind-intent boost: 쿼리 키워드와 매칭되는 kind에 부스트
+        preferred_kinds: set[NodeKind] = set()
+        q_lower = query.lower()
+        for kind, hints in _KIND_QUERY_HINTS.items():
+            if any(h in q_lower for h in hints):
+                preferred_kinds.add(kind)
+
+        # Tag-query boost: 쿼리 키워드가 노드 태그에 있으면 부스트
+        query_terms_set = set(query.lower().split())
+
         # Score with resonance
         now = time()
         activated: list[ActivatedNode] = []
         for _nid, (node, search_score) in all_nodes.items():
+            # kind 부스트
+            if preferred_kinds and node.kind in preferred_kinds:
+                search_score = min(1.0, search_score + _KIND_BOOST)
+            # tag 부스트 (정확 매칭만 — 2글자 이상 태그만)
+            if node.tags and query_terms_set:
+                tag_set = {t.lower() for t in node.tags if len(t) >= 2}
+                tag_overlap = len(query_terms_set & tag_set)
+                if tag_overlap > 0:
+                    search_score = min(1.0, search_score + tag_overlap * 0.03)
+
             resonance = self._scorer.score(node, search_score=search_score, now=now)
             activated.append(
                 ActivatedNode(