feat: LLM 기반 온톨로지 보정 — verify_relations + suggest_missing

SonAIengine · claude · SonAIengine · commit 0927bbb6a74a · 2026-03-22T18:27:51.000+09:00
## 새 메서드

### verify_relations(relations, tools)
- heuristic이 생성한 관계를 LLM이 keep/reject 판정
- E-Commerce 46 tools: 71개 → 52개 kept, 19개 rejected (45초)
- reject 정확도 높음: getUser REQUIRES createUser (X), *REQUIRES createProductReview (X)

### suggest_missing(tools, existing)
- 기존 관계에서 빠진 워크플로우 의존성 제안
- createUser→getUser, createProduct→getProduct 등 5개 추가

## 프롬프트 최적화
- verify: 간결한 keep/reject 판정 프롬프트 (tools_context 제거)
- suggest: 기존 관계 참조하여 gap 찾기
- qwen2.5:14b 기준 71개 검증 45초, 5개 제안 9초

## 전체 온톨로지 파이프라인
1. Heuristic (dependency.py): 71개 관계 자동 생성
2. LLM verify: 19개 false positive 제거 → 52개
3. LLM suggest: 5개 빠진 관계 추가 → 57개
4. 수동 편집 (workflow editor): 최종 보정

Co-Authored-By: Claude Opus 4.6 (1M context) &lt;noreply@anthropic.com&gt;
diff --git a/graph_tool_call/ontology/llm_provider.py b/graph_tool_call/ontology/llm_provider.py
@@ -94,6 +94,33 @@ class InferredRelation:
 
 Output ONLY a JSON object: {{"tool_name": ["query1", "query2"]}}"""
 
+_VERIFY_RELATIONS_PROMPT = """\
+Review these API relationships. Reply "keep" or "reject" for each.
+
+Example:
+- addToCart REQUIRES getProduct → keep (needs product ID)
+- listUsers REQUIRES createUser → reject (listing works without creation)
+
+Relations:
+{relations_list}
+
+Output ONLY JSON: [{{"source":"toolA","target":"toolB","verdict":"keep"}}]"""
+# Prompt templates are rendered with str.format(); "{{" and "}}" emit literal JSON braces.
+_SUGGEST_MISSING_PROMPT = """\
+Given these API tools and their existing relationships, suggest important \
+MISSING relationships. Focus on workflow dependencies: which tool must \
+run before which other tool?
+
+Tools:
+{tools_list}
+
+Existing relationships:
+{existing_relations}
+
+Suggest 3-5 missing relationships that are clearly needed for common workflows.
+Output ONLY a JSON array:
+[{{"source":"toolA","target":"toolB","relation":"PRECEDES","confidence":0.9,"reason":"..."}}]"""
+
 
 def _format_tools_list(tools: list[ToolSummary]) -> str:
     lines = []
@@ -244,6 +271,101 @@ def suggest_categories(
 
         return {}
 
+    def verify_relations(
+        self,
+        relations: list[InferredRelation],
+        tools: list[ToolSummary],
+        batch_size: int = 10,
+    ) -> tuple[list[InferredRelation], list[InferredRelation]]:
+        """Ask the LLM to keep or reject each auto-detected relation.
+
+        Relations are sent in batches of ``batch_size`` (values below 1 are
+        treated as 1). ``tools`` is accepted for interface compatibility but
+        is not used in the prompt. A relation is rejected only on an explicit
+        "reject" verdict (matched case-insensitively); a missing verdict or an
+        unparseable response keeps it, so an LLM failure never drops data.
+
+        Returns:
+            ``(kept, rejected)``, each preserving the input order.
+        """
+        kept: list[InferredRelation] = []
+        rejected: list[InferredRelation] = []
+        step = max(1, batch_size)  # range() raises ValueError on a zero step
+
+        for start in range(0, len(relations), step):
+            batch = relations[start : start + step]
+            # Tolerate a missing (None) reason instead of failing on the slice.
+            rels_text = "\n".join(
+                f"- {r.source} {r.relation_type.name} {r.target} ({(r.reason or '')[:60]})"
+                for r in batch
+            )
+            prompt = _VERIFY_RELATIONS_PROMPT.format(
+                relations_list=rels_text,
+            )
+            response = self.generate(prompt)
+
+            try:
+                parsed = _extract_json(response)
+                verdicts = {
+                    (item.get("source", ""), item.get("target", "")): item.get("verdict", "keep")
+                    for item in (parsed if isinstance(parsed, list) else [])
+                    if isinstance(item, dict)
+                }
+            except (json.JSONDecodeError, KeyError, TypeError):
+                verdicts = {}  # parse failure: keep the whole batch (conservative)
+
+            for rel in batch:
+                # LLM output varies in casing/spacing ("Reject", " reject "), so
+                # normalize before comparing; anything but "reject" is kept.
+                verdict = str(verdicts.get((rel.source, rel.target), "keep")).strip().lower()
+                (rejected if verdict == "reject" else kept).append(rel)
+
+        return kept, rejected
+
+    def suggest_missing(
+        self,
+        tools: list[ToolSummary],
+        existing_relations: list[InferredRelation],
+    ) -> list[InferredRelation]:
+        """Ask the LLM for workflow dependencies absent from ``existing_relations``.
+
+        Only the first 30 tools and first 30 relations go into the prompt.
+        Malformed items (non-object, relation rejected by the parser, missing
+        source/target, non-numeric confidence) are skipped; a bad response yields [].
+        """
+        existing_text = "\n".join(
+            f"- {r.source} {r.relation_type.name} {r.target}"
+            for r in existing_relations[:30]
+        )
+        prompt = _SUGGEST_MISSING_PROMPT.format(
+            tools_list=_format_tools_list(tools[:30]),
+            existing_relations=existing_text or "(none)",
+        )
+        response = self.generate(prompt)
+
+        suggestions: list[InferredRelation] = []
+        try:
+            parsed = _extract_json(response)
+        except (json.JSONDecodeError, KeyError, TypeError):
+            return suggestions
+        for item in parsed if isinstance(parsed, list) else []:
+            try:
+                rel_type = _parse_relation_type(item.get("relation", ""))
+                if rel_type is None:
+                    continue
+                suggestions.append(
+                    InferredRelation(
+                        source=item["source"],
+                        target=item["target"],
+                        relation_type=rel_type,
+                        confidence=float(item.get("confidence", 0.8)),
+                        reason=item.get("reason", "LLM suggested"),
+                    )
+                )
+            except (AttributeError, KeyError, TypeError, ValueError):
+                continue  # drop only this malformed item, keep the rest
+        return suggestions
+
     def enrich_keywords(
         self,
         tools: list[ToolSummary],