Initial release: iai-mcp v0.1.0

Co-Authored-By: Claude <noreply@anthropic.com> Co-Authored-By: XNLLLLH <XNLLLLH@users.noreply.github.com>
2026-05-06 01:04:47 -07:00 · 2026-05-06 01:04:47 -07:00 · f6b876fbe7
commit f6b876fbe7
332 changed files with 97258 additions and 0 deletions
--- a/src/iai_mcp/s4.py
+++ b/src/iai_mcp/s4.py
@ -0,0 +1,459 @@
+"""S4 viability -- on-read consistency + monotropic proactive checks (MEM-08, D-17).
+
+D-17 constitutional:
+- (e) on-read consistency: runs inside `pipeline_recall` on top-K returned
+  records. Pairwise cosine with ART vigilance ρ_s4=0.97 + `contradicts`
+  edge lookup. Emits `s4_contradiction` events. Populates
+  `RecallResponse.hints`.
+- (f) monotropic proactive: only fires when profile.monotropism_depth[domain]
+  > 0.7 AND new_record.detail_level >= 4. Scans within-domain only.
+  Performance guard: if domain > 100 records, skip with warning event.
+
+Plan 03-02 CONN-07 addition:
+- `run_offline_pass(store)` -- new entry point, CALLED by the daemon /
+  session_exit hook. Currently runs `sigma.compute_and_emit(store)` only;
+  future plans append more offline-pass items here. Failures emit
+  `kind="s4_error"` and never crash the pass.
+
+Explicitly forbidden (D-17 negative assertions):
+- NO `daily_scan` function (Ashby Requisite Variety violation).
+- NO `session_exit_sweep` function (Anderson activation-based violation).
+
+All detected contradictions go through `events.write_event` -- no .jsonl files
+(D-STORAGE).
+"""
+from __future__ import annotations
+
+from uuid import UUID
+
+import numpy as np
+
+from iai_mcp.events import write_event
+from iai_mcp.store import MemoryStore
+from iai_mcp.types import MemoryHit, MemoryRecord
+
+
+# D-17(e) vigilance: 0.97 for near-duplicate contradiction detection.
+# Stricter than write-path ρ=0.95: we only flag VERY close matches.
+# Compared with `>=` against pairwise cosine similarity, both in the on-read
+# checks and in the monotropic proactive check.
+S4_VIGILANCE_RHO = 0.97
+
+# D-17(f) performance guard: the monotropic proactive check skips its scan
+# (emitting an `s4_monotropic_skip` event instead) when the domain holds
+# strictly more than this many other records.
+MONOTROPIC_MAX_PAIRWISE = 100
+
+# D-17(f) monotropism-depth threshold: the proactive check only proceeds when
+# the profile's depth for the record's domain is strictly greater than this.
+S4_MONOTROPIC_THETA = 0.7
+
+
+def _cosine(a: list[float], b: list[float]) -> float:
+    """Cosine similarity in [-1, 1]. Returns 0.0 on zero-norm inputs."""
+    av = np.asarray(a, dtype=np.float32)
+    bv = np.asarray(b, dtype=np.float32)
+    na = float(np.linalg.norm(av))
+    nb = float(np.linalg.norm(bv))
+    if na == 0.0 or nb == 0.0:
+        return 0.0
+    return float(np.dot(av, bv) / (na * nb))
+
+
+def on_read_check(
+    store: MemoryStore,
+    hits: list[MemoryHit],
+    session_id: str,
+) -> list[dict]:
+    """D-17(e) on-read consistency check.
+
+    Two detection paths, both run per-retrieval on the top-K hits:
+
+    1. `contradicts`-edge authoritative: any pair of hits connected by an
+       existing `contradicts` edge is flagged regardless of cosine. This is
+       the definitive route -- the user (or a prior S4 run) already said
+       "these two disagree", so we surface it every time they co-retrieve.
+
+    2. Cosine + tag-polarity heuristic: pairs with cosine >= ρ_s4 (0.97) AND
+       conflicting polarity tags ({positive,negative} or {asserted,retracted})
+       are flagged as `info`-severity. or can replace this
+       with NLI-based semantic contradiction.
+
+    Returns a list of hint dicts; each dict is shaped per
+    RecallResponse.hints contract. Also writes one `s4_contradiction` event
+    per detected pair to the LanceDB events table (D-STORAGE).
+
+    note: `on_read_check_batch` is the D-SPEED variant. It accepts
+    an optional `records_cache` kwarg so pipeline_recall can reuse the cache
+    it already built at stage 1 (zero extra store.get calls). This function
+    is preserved as the back-compat / ad-hoc caller API (retrieve.recall
+    still calls it; no records_cache available there).
+    """
+    if len(hits) < 2:
+        return []
+
+    hint_list: list[dict] = []
+
+    # Load records for the hit ids. Missing records are skipped silently -- a
+    # recent store.delete could race us.
+    records: dict[UUID, MemoryRecord] = {}
+    for h in hits:
+        rec = store.get(h.record_id)
+        if rec is not None:
+            records[h.record_id] = rec
+    if len(records) < 2:
+        return []
+
+    # Load contradicts edges among these records. We precompute the set of
+    # (sorted src,dst) pairs so the pairwise loop below is O(1) lookup.
+    contradict_pairs: set[tuple[str, str]] = set()
+    try:
+        edges_df = store.db.open_table("edges").to_pandas()
+    except Exception:
+        edges_df = None
+    if edges_df is not None and not edges_df.empty:
+        contradict_df = edges_df[edges_df["edge_type"] == "contradicts"]
+        hit_ids = {str(h.record_id) for h in hits}
+        for _, row in contradict_df.iterrows():
+            src = row["src"]
+            dst = row["dst"]
+            if src in hit_ids and dst in hit_ids:
+                contradict_pairs.add(tuple(sorted([src, dst])))
+
+    # Pairwise scan across hit records.
+    hit_records = list(records.values())
+    for i in range(len(hit_records)):
+        for j in range(i + 1, len(hit_records)):
+            a = hit_records[i]
+            b = hit_records[j]
+            key = tuple(sorted([str(a.id), str(b.id)]))
+            sim = _cosine(a.embedding, b.embedding)
+
+            # Path 1: explicit edge is authoritative.
+            if key in contradict_pairs:
+                hint = {
+                    "kind": "s4_contradiction",
+                    "severity": "warning",
+                    "source_ids": [str(a.id), str(b.id)],
+                    "text": (
+                        f"inconsistency: records have a contradicts edge; "
+                        f"review {a.id}, {b.id}"
+                    ),
+                    "similarity": sim,
+                }
+                hint_list.append(hint)
+                write_event(
+                    store,
+                    kind="s4_contradiction",
+                    data={
+                        "source_ids": list(key),
+                        "similarity": sim,
+                        "mechanism": "contradicts_edge",
+                    },
+                    severity="warning",
+                    session_id=session_id,
+                    source_ids=[a.id, b.id],
+                )
+                continue
+
+            # Path 2: cosine + polarity-tag heuristic.
+            if sim >= S4_VIGILANCE_RHO:
+                a_tags = set(a.tags or [])
+                b_tags = set(b.tags or [])
+                polarity_conflict = (
+                    ("positive" in a_tags and "negative" in b_tags)
+                    or ("negative" in a_tags and "positive" in b_tags)
+                    or ("asserted" in a_tags and "retracted" in b_tags)
+                    or ("retracted" in a_tags and "asserted" in b_tags)
+                )
+                if polarity_conflict:
+                    hint = {
+                        "kind": "s4_contradiction",
+                        "severity": "info",
+                        "source_ids": [str(a.id), str(b.id)],
+                        "text": (
+                            f"inconsistency: near-duplicate ({sim:.3f}) with "
+                            f"conflicting polarity tags"
+                        ),
+                        "similarity": sim,
+                    }
+                    hint_list.append(hint)
+                    write_event(
+                        store,
+                        kind="s4_contradiction",
+                        data={
+                            "source_ids": list(key),
+                            "similarity": sim,
+                            "mechanism": "tag_polarity",
+                        },
+                        severity="info",
+                        session_id=session_id,
+                        source_ids=[a.id, b.id],
+                    )
+    return hint_list
+
+
+def on_read_check_batch(
+    store: MemoryStore,
+    hits: list[MemoryHit],
+    session_id: str,
+    records_cache: "dict[UUID, MemoryRecord] | None" = None,
+) -> list[dict]:
+    """Plan 02-07 D-SPEED: batched variant of on_read_check.
+
+    Semantically identical to on_read_check (returns the same hint-shape list,
+    emits the same events). The ONLY difference is the record-loading step:
+
+    - If `records_cache` is provided, use it directly. ZERO store.get calls.
+    - Otherwise, do ONE `store.all_records()` call instead of N `store.get()`
+      calls. ZERO per-hit round-trips either way.
+
+    The pairwise contradiction-detection loop, the polarity-tag heuristic, the
+    vigilance threshold (S4_VIGILANCE_RHO), and the event-emission logic are
+    byte-for-byte equivalent to on_read_check.
+
+    Why this is the perf-critical surface (D-SPEED SC-6):
+    Pre-fix: pipeline_recall built records_cache at stage 1, then s4.on_read_check
+             called `store.get(h.record_id)` per hit -- every call is a full
+             to_pandas() scan (~140ms each at N=100 on executor hardware).
+    Post-fix: pipeline_recall passes records_cache through; s4 does zero extra
+             round-trips. Saves ~140ms per hit x N hits per recall.
+    """
+    if len(hits) < 2:
+        return []
+
+    hint_list: list[dict] = []
+
+    # Load records via cache (preferred) or one batched fallback.
+    records: dict[UUID, MemoryRecord] = {}
+    if records_cache is not None:
+        for h in hits:
+            rec = records_cache.get(h.record_id)
+            if rec is not None:
+                records[h.record_id] = rec
+    else:
+        all_recs = store.all_records()
+        by_id = {r.id: r for r in all_recs}
+        for h in hits:
+            rec = by_id.get(h.record_id)
+            if rec is not None:
+                records[h.record_id] = rec
+    if len(records) < 2:
+        return []
+
+    # Load contradicts edges among these records. One edges.to_pandas() scan
+    # (same as on_read_check).
+    contradict_pairs: set[tuple[str, str]] = set()
+    try:
+        edges_df = store.db.open_table("edges").to_pandas()
+    except Exception:
+        edges_df = None
+    if edges_df is not None and not edges_df.empty:
+        contradict_df = edges_df[edges_df["edge_type"] == "contradicts"]
+        hit_ids = {str(h.record_id) for h in hits}
+        for _, row in contradict_df.iterrows():
+            src = row["src"]
+            dst = row["dst"]
+            if src in hit_ids and dst in hit_ids:
+                contradict_pairs.add(tuple(sorted([src, dst])))
+
+    # Pairwise scan -- identical logic to on_read_check.
+    hit_records = list(records.values())
+    for i in range(len(hit_records)):
+        for j in range(i + 1, len(hit_records)):
+            a = hit_records[i]
+            b = hit_records[j]
+            key = tuple(sorted([str(a.id), str(b.id)]))
+            sim = _cosine(a.embedding, b.embedding)
+
+            # Path 1: explicit edge is authoritative.
+            if key in contradict_pairs:
+                hint = {
+                    "kind": "s4_contradiction",
+                    "severity": "warning",
+                    "source_ids": [str(a.id), str(b.id)],
+                    "text": (
+                        f"inconsistency: records have a contradicts edge; "
+                        f"review {a.id}, {b.id}"
+                    ),
+                    "similarity": sim,
+                }
+                hint_list.append(hint)
+                write_event(
+                    store,
+                    kind="s4_contradiction",
+                    data={
+                        "source_ids": list(key),
+                        "similarity": sim,
+                        "mechanism": "contradicts_edge",
+                    },
+                    severity="warning",
+                    session_id=session_id,
+                    source_ids=[a.id, b.id],
+                )
+                continue
+
+            # Path 2: cosine + polarity-tag heuristic.
+            if sim >= S4_VIGILANCE_RHO:
+                a_tags = set(a.tags or [])
+                b_tags = set(b.tags or [])
+                polarity_conflict = (
+                    ("positive" in a_tags and "negative" in b_tags)
+                    or ("negative" in a_tags and "positive" in b_tags)
+                    or ("asserted" in a_tags and "retracted" in b_tags)
+                    or ("retracted" in a_tags and "asserted" in b_tags)
+                )
+                if polarity_conflict:
+                    hint = {
+                        "kind": "s4_contradiction",
+                        "severity": "info",
+                        "source_ids": [str(a.id), str(b.id)],
+                        "text": (
+                            f"inconsistency: near-duplicate ({sim:.3f}) with "
+                            f"conflicting polarity tags"
+                        ),
+                        "similarity": sim,
+                    }
+                    hint_list.append(hint)
+                    write_event(
+                        store,
+                        kind="s4_contradiction",
+                        data={
+                            "source_ids": list(key),
+                            "similarity": sim,
+                            "mechanism": "tag_polarity",
+                        },
+                        severity="info",
+                        session_id=session_id,
+                        source_ids=[a.id, b.id],
+                    )
+    return hint_list
+
+
+def monotropic_proactive_check(
+    store: MemoryStore,
+    new_record: MemoryRecord,
+    profile_state: dict,
+    session_id: str,
+) -> list[dict]:
+    """D-17(f) monotropic proactive check.
+
+    Three gates (all must pass):
+
+    1. `profile_state["monotropism_depth"][domain] > θ_deep` (0.7). The user's
+       autistic profile indicates DEEP focus in this domain -- we're willing
+       to spend cycles checking for near-duplicates.
+    2. `new_record.detail_level >= 4`. Shallow records (detail 1-3) don't
+       warrant the pairwise scan.
+    3. `new_record` carries a `domain:<name>` tag. Records without a domain
+       tag are excluded (nothing to compare against).
+
+    Performance guard: if the domain has > MONOTROPIC_MAX_PAIRWISE records,
+    skip the scan and emit a `s4_monotropic_skip` warning event. The scan is
+    O(N) cosine comparisons; 100 is a reasonable ceiling.
+
+    Rule 1 deviation: if `profile_state["monotropism_depth"]` is not a dict
+    (type drift), degrade silently to empty hints (no exception).
+    """
+    md = profile_state.get("monotropism_depth", {})
+    if not isinstance(md, dict):
+        return []  # profile_state wrongly typed -- degrade silently
+
+    # Locate the record's domain tag ("domain:coding", "domain:gardening", ...)
+    domain_tag: str | None = next(
+        (t for t in (new_record.tags or []) if t.startswith("domain:")),
+        None,
+    )
+    if domain_tag is None:
+        return []
+
+    # Gate 1: monotropism depth must exceed θ_deep.
+    domain_name = domain_tag.split(":", 1)[1]
+    depth = md.get(domain_name, 0.0)
+    if depth <= S4_MONOTROPIC_THETA:
+        return []
+
+    # Gate 2: detail_level must be >= 4.
+    if new_record.detail_level < 4:
+        return []
+
+    # Load same-domain records (excluding the new record itself).
+    same_domain = [
+        r for r in store.all_records()
+        if (r.tags or []) and domain_tag in r.tags and r.id != new_record.id
+    ]
+
+    # Performance guard: skip + warn above ceiling.
+    if len(same_domain) > MONOTROPIC_MAX_PAIRWISE:
+        write_event(
+            store,
+            kind="s4_monotropic_skip",
+            data={
+                "domain": domain_tag,
+                "count": len(same_domain),
+                "record_id": str(new_record.id),
+            },
+            severity="warning",
+            domain=domain_tag,
+            session_id=session_id,
+        )
+        return []
+
+    hints: list[dict] = []
+    for r in same_domain:
+        sim = _cosine(new_record.embedding, r.embedding)
+        if sim >= S4_VIGILANCE_RHO:
+            hint = {
+                "kind": "s4_monotropic_contradiction",
+                "severity": "info",
+                "source_ids": [str(new_record.id), str(r.id)],
+                "text": (
+                    f"monotropic near-duplicate in {domain_tag}: sim={sim:.3f}"
+                ),
+                "similarity": sim,
+            }
+            hints.append(hint)
+            write_event(
+                store,
+                kind="s4_monotropic_contradiction",
+                data={
+                    "domain": domain_tag,
+                    "source_ids": [str(new_record.id), str(r.id)],
+                    "similarity": sim,
+                },
+                severity="info",
+                domain=domain_tag,
+                session_id=session_id,
+                source_ids=[new_record.id, r.id],
+            )
+    return hints
+
+
+def run_offline_pass(store: MemoryStore) -> dict:
+    """Plan 03-02 CONN-07: S4 offline-pass entry point.
+
+    Called by the daemon's offline cycle (or by session_exit / cron).
+    Currently runs ONE check: `sigma.compute_and_emit(store)` -- which writes
+    `kind=sigma_observation` (developmental / healthy / insufficient_data) OR
+    `kind=sigma_drift` (mid_life_drift) and (in developmental phase) bumps the
+    Hebbian rate via a `profile_updated` event.
+
+    Failures are caught and emitted as `kind="s4_error"`; the pass does NOT
+    crash. This mirrors the diagnostic discipline of `on_read_check`:
+    S4 work is observation, never blocks reads or writes.
+
+    Returns a dict with the per-step outcome:
+      {"sigma": <snapshot dict or {"error": "..."}>}
+    """
+    from iai_mcp import sigma  # local import; sigma is heavy (networkx)
+
+    out: dict = {}
+    try:
+        out["sigma"] = sigma.compute_and_emit(store)
+    except Exception as exc:  # noqa: BLE001 - diagnostic catch-all
+        try:
+            write_event(
+                store,
+                kind="s4_error",
+                data={"step": "sigma", "error": repr(exc)},
+                severity="warning",
+            )
+        except Exception:
+            pass
+        out["sigma"] = {"error": repr(exc)}
+    return out