"""Sovereign — Knowledge Distiller.
Every time NIM turbo fires, the organism learns permanently from the response.
If the local model and NIM gave similar answers, local already knew it — skip.
If there's a gap, encode the knowledge as a semantic memory so local improves.
"The turbo teaches, then fades." — Claude spec
"""
from __future__ import annotations
import logging
import re
# Module-level logger for distillation telemetry.
log = logging.getLogger("sovereign.knowledge_distiller")
# Tunables gating whether a NIM response is worth encoding.
SIMILARITY_THRESHOLD = 0.85 # skip distillation if responses are this similar
MIN_RESPONSE_LENGTH = 30 # don't distill trivial one-liner answers
def _simple_similarity(text_a: str, text_b: str) -> float:
"""Word overlap Jaccard similarity — fast, no embeddings needed.
Good enough to catch near-identical answers. For deeper similarity
the Cortex neural layer can be plugged in later.
"""
if not text_a or not text_b:
return 0.0
words_a = set(re.findall(r'\w+', text_a.lower()))
words_b = set(re.findall(r'\w+', text_b.lower()))
if not words_a or not words_b:
return 0.0
return len(words_a & words_b) / len(words_a | words_b)
class KnowledgeDistiller:
    """Turns NIM turbo (cloud) answers into permanent Cortex memories.

    Invoked after every turbo response: when the boosted answer diverges
    from the local one, the gap is encoded as a semantic memory so the
    local model improves and the turbo fires less over time.
    """

    def __init__(self, store) -> None:
        # Backing store exposing save_memory(MemoryEntry).
        self._store = store
        # Count of distillations performed during this session.
        self._distillations = 0

    def learn(
        self,
        question: str,
        local_text: str,
        boosted_text: str,
        local_confidence: float = 0.5,
        boost_confidence: float = 0.8,
        user_id: str = "default",
    ) -> bool:
        """Encode the NIM answer as long-term memory when it beats local.

        Returns True when knowledge was distilled; False when the boosted
        answer was trivial or the local model already knew it.
        """
        # Trivial one-liners carry nothing worth encoding.
        if len(boosted_text) < MIN_RESPONSE_LENGTH:
            return False

        overlap = _simple_similarity(local_text, boosted_text)
        # Near-identical answers mean local already had this knowledge.
        if overlap > SIMILARITY_THRESHOLD:
            log.debug("Distillation skipped — similarity=%.2f", overlap)
            return False

        # A real gap exists — encode it permanently.
        gap = boost_confidence - local_confidence
        weight = min(0.9, 0.5 + gap)  # capped importance score (logged only)

        from .models import MemoryEntry, MemorySource
        entry = MemoryEntry(
            content=f"Q: {question}\nA: {boosted_text[:500]}",
            source=MemorySource.AGENT,
            confidence=boost_confidence * 0.85,  # external source penalty
            session_id="distilled",
        )
        self._store.save_memory(entry)

        self._distillations += 1
        log.info(
            "Knowledge distilled: similarity=%.2f gap=%.2f importance=%.2f "
            "session_total=%d",
            overlap, gap, weight, self._distillations,
        )
        return True

    @property
    def distillation_count(self) -> int:
        """Number of distillations performed this session."""
        return self._distillations