# Source: Synapse/python/synapse/memory/moneta_store.py (JosephOIbrahim/Synapse, branch master)
"""MonetaBackedStore — SYNAPSE MemoryStore backed by the Moneta engine (Mile 4).

Replaces the JSONL ``MemoryStore`` so the two-store divergence, the dead gauge,
and the empty stubs become *structurally* impossible: there is one store, and
``count()`` reads the engine's live entity count directly.

Mapping:
  * Each SYNAPSE ``Memory`` is serialized whole (``Memory.to_json()``) into a
    Moneta deposit's ``payload`` — it round-trips byte-for-byte.
  * ``content`` is embedded (pinned ``Embedder``) for vector recall.
  * Importance signals (decision / SHOW tier / gate source) map to a
    ``protected_floor`` so pinned memories resist Moneta's time-decay.
  * Reads enumerate the engine (``ecs.iter_rows``), deserialize payloads back
    to ``Memory``, and apply SYNAPSE's filtering/scoring here. Keyword recall is
    preserved exactly (see :func:`score_memories`); vector recall is a
    deliberate later upgrade, measured against keyword recall in shadow first.

This class is pure logic over an injected, caller-owned Moneta handle (Moneta
enforces single-owner URI locking). The factory :meth:`from_storage_dir` builds
a durable handle; tests inject an ephemeral one.
"""

from __future__ import annotations

import logging
import threading
from dataclasses import dataclass, field
from pathlib import Path
from typing import Dict, Iterable, List, Optional

from .models import Memory, MemoryQuery, MemorySearchResult, MemoryTier, MemoryType

logger = logging.getLogger(__name__)

# Importance -> protected_floor. Pinned memories resist Moneta's decay.
_DEFAULT_PROTECTED_FLOOR = 0.9


@dataclass(frozen=True)
class PruneAudit:
    """Lossless record of one sleep pass, including everything it removed.

    ``run_sleep_pass`` is the single destructive memory operation: it
    permanently prunes unprotected memories. Moneta's ``ConsolidationResult``
    only reports counts, so this record additionally keeps the ids, raw
    payloads and memory types of the removed entries — data loss is always
    visible. The legacy return shape is still readable through
    ``.pruned`` / ``.staged`` / ``.attention_updated``.
    """

    # SYNAPSE ``Memory.id`` of each pruned memory whose payload deserialized.
    pruned_ids: List[str] = field(default_factory=list)
    # Moneta entity ids (UUIDs rendered with ``str``) of every pruned entity.
    pruned_entity_ids: List[str] = field(default_factory=list)
    # Raw serialized payload of each pruned entity, keyed by entity id.
    pruned_payloads: Dict[str, str] = field(default_factory=dict)
    # Memory type of each pruned memory, keyed by ``Memory.id``.
    pruned_types: Dict[str, str] = field(default_factory=dict)
    # Engine entity count observed before and after the pass.
    count_before: int = 0
    count_after: int = 0
    # Counters mirrored from the engine's own result object.
    attention_updated: int = 0
    staged: int = 0

    @property
    def pruned(self) -> int:
        """Number of engine entities removed by the pass."""
        removed = self.pruned_entity_ids
        return len(removed)


def score_memories(
    memories: Iterable[Memory], query: MemoryQuery
) -> List[MemorySearchResult]:
    """Filter and rank ``memories`` against ``query`` with keyword scoring.

    Parity target for ``MemoryStore.search``. Narrowing by type / tag / keyword
    uses raw, case-sensitive set membership (the ``search`` behaviour, not the
    ``get_by_tag`` one). Scoring adds 0.2 per matching tag, 0.2 per matching
    keyword, 0.5 for a full-text hit in the content, 0.3 for one in the
    summary and 0.1 per query word found in either. A query with no text, tags
    or keywords gives every surviving memory a flat 0.5. Scores are capped at
    1.0, results are ordered by ``(-score, id)`` and truncated to
    ``query.limit`` when that is positive.

    Kept standalone so the JSONL store is untouched; Mile 5's shadow harness
    measures any divergence empirically.
    """
    # Query-derived values are the same for every memory, so build them once.
    type_filter = set(query.memory_types) if query.memory_types else None
    tag_filter = set(query.tags) if query.tags else None
    keyword_filter = set(query.keywords) if query.keywords else None
    needle = query.text.lower() if query.text else None
    needle_words = needle.split() if needle is not None else []
    browse_all = not (query.text or query.tags or query.keywords)

    scored: List[MemorySearchResult] = []
    for candidate in memories:
        # --- narrowing: type, then tags, then keywords -----------------------
        if type_filter is not None and candidate.memory_type not in type_filter:
            continue
        tag_hits = None
        if tag_filter is not None:
            tag_hits = tag_filter & set(candidate.tags)
            if not tag_hits:
                continue
        keyword_hits = None
        if keyword_filter is not None:
            keyword_hits = keyword_filter & set(candidate.keywords)
            if not keyword_hits:
                continue

        # --- attribute filters ----------------------------------------------
        if candidate.is_consolidated and not query.include_consolidated:
            continue
        if query.tier and candidate.tier != query.tier:
            continue
        if query.source and candidate.source != query.source:
            continue
        if query.since and candidate.created_at < query.since:
            continue
        if query.until and candidate.created_at > query.until:
            continue

        # --- scoring ----------------------------------------------------------
        total = 0.0
        reasons: List[str] = []

        if tag_hits:
            total += len(tag_hits) * 0.2
            reasons.append(f"tags: {', '.join(tag_hits)}")
        if keyword_hits:
            total += len(keyword_hits) * 0.2
            reasons.append(f"keywords: {', '.join(keyword_hits)}")
        if needle is not None:
            body = candidate.content.lower()
            digest = candidate.summary.lower()
            if needle in body:
                total += 0.5
                reasons.append("content match")
            if needle in digest:
                total += 0.3
                reasons.append("summary match")
            word_matches = sum(
                1 for word in needle_words if word in body or word in digest
            )
            if word_matches > 0:
                total += word_matches * 0.1
                reasons.append(f"{word_matches} word matches")

        # A criteria-free query lists everything that passed the filters.
        if browse_all:
            total = 0.5

        if total > 0:
            scored.append(
                MemorySearchResult(
                    memory=candidate,
                    score=min(1.0, total),
                    match_reasons=reasons,
                )
            )

    ranked = sorted(scored, key=lambda hit: (-hit.score, hit.memory.id))
    return ranked[: query.limit] if query.limit > 0 else ranked


class MonetaUpdateNotSupported(NotImplementedError):
    """Raised for in-place update, targeted delete, or clear requests.

    Moneta is an append/consolidate engine, so these operations have no clean
    equivalent. Subclasses ``NotImplementedError`` so generic handlers for
    unsupported operations still catch it.
    """


class MonetaBackedStore:
    """``MemoryStore``-compatible facade over a single Moneta handle."""

    def __init__(self, handle, embedder, *, protected_floor: float = _DEFAULT_PROTECTED_FLOOR):
        """Wrap a caller-owned Moneta ``handle``.

        Args:
            handle: The Moneta handle all engine calls are made on.
            embedder: Object whose ``embed(text)`` produces the vector stored
                with each deposit; its ``id`` attribute, if any, is recorded.
            protected_floor: ``protected_floor`` passed to the engine for
                memories that :meth:`_is_protected` classifies as pinned.
        """
        # FC4: every engine access is serialized through this lock. Moneta's ECS
        # is single-writer — concurrent deposit/iterate/prune corrupts its
        # swap-and-pop index — so the adapter is made thread-safe by
        # construction. The lock guards ONLY in-process Python state and is
        # never held across an hdefereval main-thread hop (this adapter makes
        # zero hou.* calls — see the no-hou-import guard test), so it cannot
        # deadlock the async server. It is an RLock rather than a Lock because
        # close() -> save() is a guarded-calls-guarded edge.
        self._lock = threading.RLock()
        self._protected_floor = protected_floor
        self._embedder = embedder
        self._handle = handle
        # Record which embedder produced the vectors so a future embedder swap
        # can detect entries that need re-embedding (handoff capsule PARKED note).
        self.embedder_id = getattr(embedder, "id", "unknown")

    # Protected memories (decisions / show-tier / gate) are exactly the
    # keep-forever set, so the per-handle protected quota is set high: Moneta's
    # default 100 is a backstop that would silently demote the 101st pin to
    # prunable (CRUCIBLE finding). We never want that for SYNAPSE.
    _PROTECTED_QUOTA = 100_000

    @classmethod
    def from_storage_dir(
        cls,
        storage_dir,
        embedder=None,
        *,
        protected_floor: float = _DEFAULT_PROTECTED_FLOOR,
        protected_quota: int = _PROTECTED_QUOTA,
    ) -> "MonetaBackedStore":
        """Build a durable, project-scoped Moneta-backed store.

        Snapshot + WAL live under ``<storage_dir>/.moneta/``; the ``storage_uri``
        is stable per project dir so the URI lock and snapshot reload key are
        consistent across restarts. The background snapshot daemon is NOT
        started here — under the async server it races the ECS single-writer
        (FC4). Persistence is via :meth:`save` (synchronous snapshot).

        A corrupt snapshot is quarantined (renamed, preserved) and the store
        starts fresh, rather than crashing startup or silently abandoning the
        file — Moneta's ``hydrate()`` does a bare ``json.load`` (CRUCIBLE finding).

        Args:
            storage_dir: Project directory; ``.moneta/`` is created beneath it.
            embedder: Embedder to use. Only ``None`` selects the default
                ``HashEmbedder``; any other object is used as given.
            protected_floor: Floor applied to protected memories on deposit.
            protected_quota: Passed to the engine config as ``quota_override``.

        Returns:
            A store wrapping a freshly constructed Moneta handle.

        Raises:
            RuntimeError: If the Moneta runtime is not importable.
        """
        from .embedding import HashEmbedder
        from . import moneta_runtime as mr

        if not mr.moneta_available():
            raise RuntimeError(
                f"Moneta backend requested but not importable: {mr.import_error()}"
            )
        # Test for None explicitly: ``embedder or HashEmbedder()`` would also
        # replace a caller-supplied embedder that merely evaluates as falsy
        # (e.g. one defining ``__len__`` or ``__bool__``).
        if embedder is None:
            embedder = HashEmbedder()
        root = Path(storage_dir)
        base = root / ".moneta"
        base.mkdir(parents=True, exist_ok=True)
        snapshot_path = base / "snapshot.json"
        # Must run before the handle is built so the engine never sees a bad file.
        cls._quarantine_if_corrupt(snapshot_path)
        cfg = mr.MonetaConfig(
            storage_uri=f"moneta-file://{root.resolve().as_posix()}",
            embedding_dim=embedder.dim,
            quota_override=protected_quota,
            snapshot_path=snapshot_path,
            wal_path=base / "wal.log",
        )
        handle = mr.Moneta(cfg)
        return cls(handle, embedder, protected_floor=protected_floor)

    _SNAPSHOT_REQUIRED_KEYS = (
        "entity_id", "payload", "semantic_vector", "utility",
        "attended_count", "protected_floor", "last_evaluated", "state",
    )

    @classmethod
    def _quarantine_if_corrupt(cls, snapshot_path: Path) -> None:
        """Rename a corrupt snapshot aside so startup neither crashes nor
        silently discards it. Best-effort; a valid/absent snapshot is untouched.

        A snapshot counts as valid when it parses as a JSON object whose
        ``rows`` entry (treated as empty when absent) is a list of objects that
        each contain every key in ``_SNAPSHOT_REQUIRED_KEYS``. Anything else —
        including a file that cannot be read — is renamed to
        ``<name>.corrupt-<unix-seconds>``. If the rename itself fails the file
        is removed as a last resort so startup can proceed. Never raises.
        """
        if not snapshot_path.exists():
            return
        import json
        import time as _time
        try:
            with open(snapshot_path, "r", encoding="utf-8") as fp:
                data = json.load(fp)
            rows = data.get("rows", []) if isinstance(data, dict) else None
            if not isinstance(rows, list):
                raise ValueError("snapshot missing a 'rows' list")
            for row in rows:
                # ``k in row`` only means "has this field" for a mapping; on a
                # string it is a substring test and on a list an element test,
                # so reject non-object rows explicitly.
                if not isinstance(row, dict):
                    raise ValueError("snapshot row is not an object")
                if not all(k in row for k in cls._SNAPSHOT_REQUIRED_KEYS):
                    raise ValueError("snapshot row missing required keys")
        except Exception as exc:
            bad = snapshot_path.with_name(f"{snapshot_path.name}.corrupt-{int(_time.time())}")
            try:
                snapshot_path.replace(bad)
                logger.error(
                    "Quarantined corrupt Moneta snapshot %s -> %s (%s); starting fresh",
                    snapshot_path, bad, exc,
                )
            except Exception as move_err:  # last resort: remove so startup proceeds
                logger.error(
                    "Corrupt snapshot %s unrecoverable (%s); removing", snapshot_path, move_err
                )
                try:
                    snapshot_path.unlink()
                except OSError as unlink_err:
                    # Still best-effort, but leave a trace: the bad file is
                    # still in place and the engine will see it.
                    logger.error(
                        "Could not remove corrupt snapshot %s (%s)",
                        snapshot_path, unlink_err,
                    )

    # -- write --------------------------------------------------------------

    def _is_protected(self, memory: Memory) -> bool:
        """Return True when ``memory`` should be deposited with a protected floor.

        A memory is protected when it is a decision, lives in the SHOW tier, or
        was produced by the ``"gate"`` source.
        """
        if memory.memory_type == MemoryType.DECISION:
            return True
        if memory.tier == MemoryTier.SHOW:
            return True
        return memory.source == "gate"

    def add(self, memory: Memory) -> str:
        """Deposit ``memory`` into the engine and return its ``id``.

        The content (falling back to the summary, then to an empty string) is
        embedded, and the whole memory is stored as its ``to_json()`` payload.
        Protected memories are deposited with the configured floor; if that
        deposit fails, the memory is stored unprotected rather than dropped.
        A failed unprotected deposit propagates to the caller.
        """
        source_text = memory.content
        if not source_text:
            source_text = memory.summary or ""
        vector = self._embedder.embed(source_text)
        blob = memory.to_json()
        if self._is_protected(memory):
            floor = self._protected_floor
        else:
            floor = 0.0

        with self._lock:
            try:
                self._handle.deposit(blob, vector, protected_floor=floor)
            except Exception as exc:  # ProtectedQuotaExceededError, etc.
                if not floor > 0.0:
                    # Nothing weaker to fall back to for an unprotected deposit.
                    raise
                # Never drop a memory because the protected quota is full.
                logger.warning(
                    "Protected deposit failed (%s); storing unprotected: %s",
                    type(exc).__name__, exc,
                )
                self._handle.deposit(blob, vector, protected_floor=0.0)
        return memory.id

    # -- enumerate (the one coupling to Moneta internals, centralized) ------

    def _iter_memories(self) -> List[Memory]:
        """Return every stored memory as a freshly built list.

        The engine rows are materialized while the lock is held, so each read
        works from one point-in-time set of rows. A list is returned instead of
        a generator on purpose: a lazy generator would keep the lock held across
        caller work (or until GC if abandoned). JSON deserialization happens
        after the lock is released. A payload that ``Memory.from_json`` rejects
        raises from here, since nothing in this method catches it.
        """
        with self._lock:
            snapshot = tuple(self._handle.ecs.iter_rows())
        # Lock released: only the already-captured rows are touched below.
        return [Memory.from_json(entry.payload) for entry in snapshot]

    # -- read ---------------------------------------------------------------

    def count(self) -> int:
        """Return the engine's live entity count (``ecs.n``), read under the lock."""
        with self._lock:
            live = self._handle.ecs.n
        return live

    def all(self) -> List[Memory]:
        """Return a new list holding every stored memory."""
        return [*self._iter_memories()]

    def get(self, memory_id: str) -> Optional[Memory]:
        """Return the first stored memory whose ``id`` equals ``memory_id``, else None."""
        matches = (mem for mem in self._iter_memories() if mem.id == memory_id)
        return next(matches, None)

    def get_recent(self, limit: int = 10) -> List[Memory]:
        """Return up to ``limit`` memories, newest ``created_at`` first.

        Args:
            limit: Maximum number of memories to return. Zero or a negative
                value yields an empty list. ``None`` is tolerated for
                backward compatibility and means "no limit".

        Returns:
            Memories ordered by descending ``created_at``; ties keep the
            engine's enumeration order.
        """
        # A negative limit used to reach the slice below as ``[:limit]``, which
        # drops entries from the END (the oldest ones) and returns the rest —
        # never what a "most recent N" caller means. Treat it like zero.
        if limit is not None and limit <= 0:
            return []
        newest_first = sorted(
            self._iter_memories(), key=lambda m: m.created_at, reverse=True
        )
        return newest_first[:limit]

    def get_by_type(self, memory_type: MemoryType) -> List[Memory]:
        """Return every stored memory whose ``memory_type`` equals ``memory_type``."""
        everything = self._iter_memories()
        return list(filter(lambda mem: mem.memory_type == memory_type, everything))

    def get_by_tag(self, tag: str) -> List[Memory]:
        """Return every stored memory whose ``tags`` contain ``tag``.

        The comparison is raw and case-sensitive (``tag`` is not normalised),
        which is the same tag semantics ``search()`` uses.
        """
        tagged: List[Memory] = []
        for mem in self._iter_memories():
            if tag in mem.tags:
                tagged.append(mem)
        return tagged

    def get_linked(self, memory_id: str) -> List[Memory]:
        """Return the stored memories that ``memory_id`` links to.

        Looks up the first memory with that id and collects the ``target_id``
        of each of its links. The result holds every stored memory whose id is
        among those targets, in enumeration order. An unknown ``memory_id``
        yields an empty list.
        """
        snapshot = [*self._iter_memories()]
        for origin in snapshot:
            if origin.id != memory_id:
                continue
            wanted = {link.target_id for link in origin.links}
            return [mem for mem in snapshot if mem.id in wanted]
        return []

    def search(self, query: MemoryQuery) -> List[MemorySearchResult]:
        """Score a snapshot of all stored memories against ``query``.

        Filtering, scoring, ordering and the limit are all delegated to
        :func:`score_memories`.
        """
        candidates = self._iter_memories()
        return score_memories(candidates, query)

    # -- lifecycle ----------------------------------------------------------

    def save(self) -> None:
        """Durably snapshot the engine. No-op when durability is disabled (ephemeral).

        Runs under the lock. A snapshot failure is logged as a warning and not
        raised.
        """
        with self._lock:
            durability = getattr(self._handle, "durability", None)
            if durability is None:
                # Handle has no durability layer: nothing to persist.
                return
            try:
                durability.snapshot_ecs(self._handle.ecs)
            except Exception as exc:
                logger.warning("Moneta snapshot on save() failed: %s", exc)

    def run_sleep_pass(self) -> PruneAudit:
        """Trigger Moneta consolidation/decay — AUDITABLE and serialized.

        This is the one destructive memory op: it permanently prunes unprotected
        memories. We capture the live id-set + payloads BEFORE the pass, run it,
        then diff the survivors to recover exactly which entities were pruned —
        so data loss is logged, never silent. The capture, the pass and the
        survivor scan are held under the lock (the prune mutates the ECS and
        must not interleave with deposit/iterate).

        Only the payloads of entities that were actually pruned are
        deserialized, and that happens after the lock is released: the
        ``Memory`` objects are needed solely to report ids and types of what
        was removed, so decoding every live row under the lock was wasted work.

        Returns:
            A :class:`PruneAudit` with the pruned entity ids, their raw
            payloads, the ``Memory.id`` / type of each pruned payload that
            deserialized, the before/after entity counts, and the
            ``attention_updated`` / ``staged`` counters from the engine result
            (0 when the result lacks them).
        """
        with self._lock:
            ecs = self._handle.ecs
            before_payload: Dict[str, str] = {
                str(row.entity_id): row.payload for row in ecs.iter_rows()
            }
            count_before = ecs.n

            result = self._handle.run_sleep_pass()

            survivors = {str(row.entity_id) for row in ecs.iter_rows()}
            count_after = ecs.n

        # Everything below works on data captured above; no engine access.
        pruned_payloads: Dict[str, str] = {
            eid: payload
            for eid, payload in before_payload.items()
            if eid not in survivors
        }
        pruned_eids = list(pruned_payloads)
        pruned_ids: List[str] = []
        pruned_types: Dict[str, str] = {}
        for payload in pruned_payloads.values():
            try:
                mem = Memory.from_json(payload)
            except Exception:
                # Undecodable: the raw payload stays in pruned_payloads for forensics.
                continue
            if mem is None:
                continue
            pruned_ids.append(mem.id)
            pruned_types[mem.id] = getattr(mem.memory_type, "value", str(mem.memory_type))

        audit = PruneAudit(
            pruned_ids=pruned_ids,
            pruned_entity_ids=pruned_eids,
            pruned_payloads=pruned_payloads,
            pruned_types=pruned_types,
            count_before=count_before,
            count_after=count_after,
            attention_updated=getattr(result, "attention_updated", 0),
            staged=getattr(result, "staged", 0),
        )
        if audit.pruned:
            logger.warning(
                "moneta.prune lossless-audit pruned=%d staged=%d before=%d after=%d ids=%s",
                audit.pruned, audit.staged, count_before, count_after, pruned_ids,
            )
        else:
            logger.info(
                "moneta.sleep_pass pruned=0 staged=%d attended=%d n=%d",
                audit.staged, audit.attention_updated, count_after,
            )
        return audit

    def close(self) -> None:
        """Snapshot via :meth:`save`, then call the handle's ``close()`` if it has one.

        Both steps run under the lock; ``save()`` re-enters it, which is why the
        lock is re-entrant.
        """
        with self._lock:
            self.save()
            closer = getattr(self._handle, "close", None)
            if not callable(closer):
                return
            closer()

    # -- unsupported (append/consolidate engine) ----------------------------

    def update(self, memory: Memory):
        """Always raise :class:`MonetaUpdateNotSupported`; in-place update is unavailable."""
        reason = (
            "MonetaBackedStore is append/consolidate; in-place update is not "
            "supported. Re-add as a new memory or trigger consolidation."
        )
        raise MonetaUpdateNotSupported(reason)

    def delete(self, memory_id: str) -> bool:
        """Always raise :class:`MonetaUpdateNotSupported`; targeted delete is unavailable."""
        reason = (
            "MonetaBackedStore does not support targeted delete; pruning is "
            "handled by run_sleep_pass() decay/consolidation."
        )
        raise MonetaUpdateNotSupported(reason)

    def clear(self):
        """Always raise :class:`MonetaUpdateNotSupported`; a live handle cannot be cleared."""
        reason = (
            "MonetaBackedStore.clear() is unsupported on a live handle; "
            "construct a fresh handle for a clean store."
        )
        raise MonetaUpdateNotSupported(reason)