fix(blackbox): address review blockers B1–B7 + re-capture proof bundle

A full multi-agent review found 7 real issues (4 blockers). All fixed + tested. B1 (blocker): Promoting a Memory PR did not release the quarantined memory — the UI said "promoted" while the memory stayed suppressed/out of retrieval. act_on_memory_pr now calls reverse_suppression(subject_id) on accept actions; MemoryPrAction::releases_memory() encodes the rule (promote/merge/supersede release; forget/quarantine keep it held). Proven live: PR response subjectReleased:true, SQLite suppression_count 0. B2 (blocker): memory promote/demote (returns `action`, not `decision`) and codebase remember_* writes bypassed the write-trace + PR gate. extract_writes now reads `action` too, filtered by is_write_decision (reads like get/state excluded); is_write_tool includes `codebase`. B3 (blocker): receipt ids collided within a run (r_<date>_<runId> + INSERT OR REPLACE overwrote earlier receipts). IDs are now r_<date>_<runId8>_<unique6>; build() mints the suffix, build_with_unique() keeps tests deterministic. B4 (blocker): proof bundle was assembled from two runs (trace.json=run_proof, websocket-events.jsonl=run_proof2). Re-captured the whole bundle from a single run — trace, websocket, receipt, and memory_pr all carry run_proof now. B5: Black Box receipts panel showed global latest, not the selected run. Added list_receipts_for_run + /api/receipts?run= ; the page uses listForRun. B6: SENSITIVE_TOPICS substring matching false-fired (tokenizer->token, author->auth, secretary->secret). Switched to word-boundary matching; real phrasings (auth token, security vulnerability, api key) still gate. B7: set_review_mode now writes atomically (temp+rename via write_atomic); export_trace sanitizes run_id in the Content-Disposition filename; memory-prs static routes declared before the dynamic /{id} route. Withdrawn: the /mode-vs-/{id} route order is NOT a functional bug (axum 0.8 / matchit prioritizes static segments) — reordered for clarity only. Gates: 999 lib tests pass (+9 new regressions), clippy -D warnings clean, dashboard check + build clean. Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
2026-07-02 22:01:01 +02:00 · 2026-06-22 18:46:14 -05:00 · 2026-06-22 18:46:14 -05:00 · 8f7bed0463
commit 8f7bed0463
parent cadffb419b
17 changed files with 486 additions and 63 deletions
--- a/crates/vestige-core/src/storage/trace_store.rs
+++ b/crates/vestige-core/src/storage/trace_store.rs
@ -282,6 +282,31 @@ impl SqliteMemoryStore {
        Ok(out)
    }

+    /// List the receipts belonging to one run, newest first (B5). The Black Box
+    /// receipts panel uses this so the receipts it shows actually belong to the
+    /// selected run, not the global latest.
+    pub fn list_receipts_for_run(&self, run_id: &str, limit: usize) -> Result<Vec<Receipt>> {
+        let reader = self
+            .reader
+            .lock()
+            .map_err(|_| StorageError::Init("Reader lock poisoned".into()))?;
+        let mut stmt = reader.prepare(
+            "SELECT payload FROM memory_receipts WHERE run_id = ?1
+             ORDER BY created_at DESC LIMIT ?2",
+        )?;
+        let rows = stmt.query_map(params![run_id, limit as i64], |row| {
+            let p: String = row.get(0)?;
+            Ok(p)
+        })?;
+        let mut out = Vec::new();
+        for r in rows {
+            if let Ok(rc) = serde_json::from_str::<Receipt>(&r?) {
+                out.push(rc);
+            }
+        }
+        Ok(out)
+    }
+
    // ========================================================================
    // MEMORY PRs — the risk-gated review queue
    // ========================================================================
@ -534,6 +559,37 @@ mod tests {
        assert_eq!(s.list_receipts(10).unwrap().len(), 1);
    }

+    #[test]
+    fn receipts_are_listable_per_run_b5() {
+        let s = store();
+        let mk = |id: &str| Receipt {
+            receipt_id: id.into(),
+            retrieved: vec!["m1".into()],
+            suppressed: vec![],
+            activation_path: vec![],
+            trust_floor: 0.9,
+            decay_risk: DecayRisk::Low,
+            mutations: vec![],
+        };
+        s.save_receipt(&mk("r_a1"), Some("run_a"), Some("search"), None)
+            .unwrap();
+        s.save_receipt(&mk("r_a2"), Some("run_a"), Some("search"), None)
+            .unwrap();
+        s.save_receipt(&mk("r_b1"), Some("run_b"), Some("search"), None)
+            .unwrap();
+
+        let run_a = s.list_receipts_for_run("run_a", 10).unwrap();
+        assert_eq!(run_a.len(), 2, "run_a has exactly its 2 receipts");
+        assert!(run_a.iter().all(|r| r.receipt_id.starts_with("r_a")));
+
+        let run_b = s.list_receipts_for_run("run_b", 10).unwrap();
+        assert_eq!(run_b.len(), 1, "run_b has only its own receipt");
+        assert_eq!(run_b[0].receipt_id, "r_b1");
+
+        // Global list still sees all three.
+        assert_eq!(s.list_receipts(10).unwrap().len(), 3);
+    }
+
    #[test]
    fn memory_pr_lifecycle() {
        let s = store();
@ -569,6 +625,39 @@ mod tests {
        assert_eq!(s.count_pending_memory_prs().unwrap(), 0);
    }

+    #[test]
+    fn promote_releases_a_quarantined_memory_end_to_end() {
+        // B1 regression: the full quarantine→release cycle at the storage layer.
+        // gate_writes suppresses a risky write; an accept action must reverse it.
+        let s = store();
+        let node = s
+            .ingest(crate::IngestInput {
+                content: "Risky write that got quarantined.".to_string(),
+                node_type: "fact".to_string(),
+                ..Default::default()
+            })
+            .expect("ingest");
+        assert_eq!(node.suppression_count, 0, "fresh node not suppressed");
+
+        // Quarantine it (what gate_writes does for a risky write).
+        let suppressed = s.suppress_memory(&node.id).expect("suppress");
+        assert_eq!(
+            suppressed.suppression_count, 1,
+            "quarantined write is suppressed (held out of retrieval)"
+        );
+
+        // Promote = release. (The action releases_memory() == true; the handler
+        // calls reverse_suppression on the subject.)
+        assert!(crate::MemoryPrAction::Promote.releases_memory());
+        let released = s
+            .reverse_suppression(&node.id, 24)
+            .expect("reverse suppression within labile window");
+        assert_eq!(
+            released.suppression_count, 0,
+            "promoting the PR must release the memory — not leave it suppressed"
+        );
+    }
+
    #[test]
    fn ask_agent_why_is_not_a_decision() {
        let s = store();
--- a/crates/vestige-core/src/trace/receipt.rs
+++ b/crates/vestige-core/src/trace/receipt.rs
@ -59,9 +59,13 @@ pub struct Receipt {
 impl Receipt {
    /// Build a receipt from already-computed retrieval signals.
    ///
-    /// `receipt_id` is derived from `now` + a short discriminator so it is both
-    /// human-legible and collision-resistant within a day. `trust_scores` is the
-    /// per-id FSRS retrievability/trust the pipeline already produced.
+    /// `receipt_id` is `r_<date>_<discriminator8>_<unique6>` — human-legible
+    /// and dated, with a short random suffix so that **multiple retrievals in
+    /// the same run never collide** (B3). The discriminator (usually the runId)
+    /// keeps receipts from one run visually grouped; the suffix guarantees
+    /// uniqueness so `INSERT OR REPLACE` can't overwrite an earlier receipt.
+    /// `trust_scores` is the per-id FSRS retrievability/trust the pipeline
+    /// already produced.
    pub fn build(
        now: chrono::DateTime<chrono::Utc>,
        discriminator: &str,
@ -70,6 +74,32 @@ impl Receipt {
        activation_path: Vec<String>,
        trust_scores: &[f64],
        mutations: Vec<ReceiptMutation>,
+    ) -> Self {
+        Self::build_with_unique(
+            now,
+            discriminator,
+            &uuid::Uuid::new_v4().simple().to_string()[..6],
+            retrieved,
+            suppressed,
+            activation_path,
+            trust_scores,
+            mutations,
+        )
+    }
+
+    /// Like [`Receipt::build`] but with a caller-supplied uniqueness token,
+    /// so the id is fully deterministic for tests. Production uses
+    /// [`Receipt::build`] which mints a random token.
+    #[allow(clippy::too_many_arguments)]
+    pub fn build_with_unique(
+        now: chrono::DateTime<chrono::Utc>,
+        discriminator: &str,
+        unique: &str,
+        retrieved: Vec<String>,
+        suppressed: Vec<SuppressedReceiptEntry>,
+        activation_path: Vec<String>,
+        trust_scores: &[f64],
+        mutations: Vec<ReceiptMutation>,
    ) -> Self {
        let trust_floor = trust_scores
            .iter()
@ -87,7 +117,17 @@ impl Receipt {
            .filter(|c| c.is_ascii_alphanumeric())
            .take(8)
            .collect();
-        let receipt_id = format!("r_{}_{}", now.format("%Y_%m_%d"), short);
+        let unique_clean: String = unique
+            .chars()
+            .filter(|c| c.is_ascii_alphanumeric())
+            .take(6)
+            .collect();
+        let receipt_id = format!(
+            "r_{}_{}_{}",
+            now.format("%Y_%m_%d"),
+            short,
+            unique_clean
+        );

        Self {
            receipt_id,
@ -182,16 +222,31 @@ mod tests {

    #[test]
    fn receipt_id_is_human_legible_and_dated() {
-        let r = Receipt::build(
+        let r = Receipt::build_with_unique(
            fixed_now(),
            "abc123!!",
+            "u1u2u3",
            vec!["mem_1".into()],
            vec![],
            vec![],
            &[0.9],
            vec![],
        );
-        assert_eq!(r.receipt_id, "r_2026_06_22_abc123");
+        assert_eq!(r.receipt_id, "r_2026_06_22_abc123_u1u2u3");
+    }
+
+    #[test]
+    fn receipt_ids_unique_within_a_run_b3() {
+        // B3: two retrievals in the SAME run (same date + discriminator) must
+        // get DISTINCT ids so INSERT OR REPLACE can't overwrite the first.
+        let a = Receipt::build(fixed_now(), "run_x", vec![], vec![], vec![], &[], vec![]);
+        let b = Receipt::build(fixed_now(), "run_x", vec![], vec![], vec![], &[], vec![]);
+        assert_ne!(
+            a.receipt_id, b.receipt_id,
+            "same-run receipts must not collide"
+        );
+        assert!(a.receipt_id.starts_with("r_2026_06_22_runx_"));
+        assert!(b.receipt_id.starts_with("r_2026_06_22_runx_"));
    }

    #[test]
--- a/crates/vestige-core/src/trace/review.rs
+++ b/crates/vestige-core/src/trace/review.rs
@ -183,6 +183,11 @@ const SENSITIVE_TOPICS: &[(&str, &str)] = &[
    ("api key", "credential / API key"),
    ("security", "security-relevant fact"),
    ("vuln", "security vulnerability"),
+    ("vulnerability", "security vulnerability"),
+    ("credential", "credential material"),
+    ("credentials", "credential material"),
+    ("api key", "credential / API key"),
+    ("apikey", "credential / API key"),
    // money / bounty / legal
    ("money", "financial fact"),
    ("payment", "financial fact"),
@ -345,21 +350,50 @@ fn collect_signals(ctx: &WriteContext) -> Vec<RiskSignal> {
 }

 /// Return the human label of the first sensitive topic found in content/tags.
+///
+/// B6: matches on WORD BOUNDARIES, not substrings — so "tokenizer" no longer
+/// trips "token", "author" no longer trips "auth", "secretary" no longer trips
+/// "secret". Multi-word needles (e.g. "api key") match a consecutive run of
+/// words. The text is lowercased and split on any non-alphanumeric char.
 fn first_sensitive_topic(content: &str, tags: &[String]) -> Option<&'static str> {
-    let haystack = {
-        let mut s = content.to_ascii_lowercase();
-        for t in tags {
-            s.push(' ');
-            s.push_str(&t.to_ascii_lowercase());
+    // Tokenize content + tags into lowercased alphanumeric words.
+    let mut words: Vec<String> = Vec::new();
+    let mut push_words = |s: &str| {
+        for w in s
+            .to_ascii_lowercase()
+            .split(|c: char| !c.is_ascii_alphanumeric())
+        {
+            if !w.is_empty() {
+                words.push(w.to_string());
+            }
        }
-        s
    };
+    push_words(content);
+    for t in tags {
+        push_words(t);
+    }
+
    SENSITIVE_TOPICS
        .iter()
-        .find(|(needle, _)| haystack.contains(needle))
+        .find(|(needle, _)| matches_word_sequence(&words, needle))
        .map(|(_, label)| *label)
 }

+/// Whether `needle` (one or more space-separated words) appears as a consecutive
+/// whole-word run in `words`.
+fn matches_word_sequence(words: &[String], needle: &str) -> bool {
+    let needle_words: Vec<&str> = needle.split_whitespace().collect();
+    if needle_words.is_empty() {
+        return false;
+    }
+    if needle_words.len() == 1 {
+        return words.iter().any(|w| w == needle_words[0]);
+    }
+    words
+        .windows(needle_words.len())
+        .any(|win| win.iter().zip(&needle_words).all(|(w, n)| w == n))
+}
+
 // ============================================================================
 // MEMORY PR DATA MODEL
 // ============================================================================
@ -490,6 +524,21 @@ impl MemoryPrAction {
            MemoryPrAction::AskAgentWhy => return None,
        })
    }
+
+    /// Whether deciding the PR with this action should **release** the subject
+    /// memory from quarantine (reverse the suppression that gate_writes applied).
+    ///
+    /// A risky write is committed-then-suppressed; approving it must restore its
+    /// retrieval influence, otherwise the UI says "promoted" while the memory
+    /// stays held out — the bug this guards against. Accept actions release;
+    /// `Quarantine` keeps it held; `Forget` rejects it (stays suppressed);
+    /// `AskAgentWhy` is read-only.
+    pub fn releases_memory(&self) -> bool {
+        matches!(
+            self,
+            MemoryPrAction::Promote | MemoryPrAction::Merge | MemoryPrAction::Supersede
+        )
+    }
 }

 /// A reviewable change to the agent's brain — the persisted Memory PR record.
@ -609,6 +658,55 @@ mod tests {
        }
    }

+    #[test]
+    fn sensitive_topic_word_boundary_no_false_positives_b6() {
+        // B6: these ordinary technical writes must NOT gate — they only CONTAIN
+        // a sensitive substring, they don't USE the sensitive word.
+        // These each only CONTAIN a sensitive substring; the word-boundary fix
+        // means they no longer gate. (Note: bare "license"/"contract"/"legal"
+        // ARE kept as gating words — a license/contract fact is legitimately
+        // legal-relevant — so they're intentionally not in this benign set.)
+        for benign in [
+            "The tokenizer converts input strings to embeddings.",
+            "The author of this module is documented in the header.",
+            "The secretary pattern coordinates the worker pool.",
+            "Contraction of the array happens during compaction.",
+            "The authority record links to the canonical node.",
+            "The authentication-free endpoint is for health checks.", // "authentication" != "auth"
+        ] {
+            let mut ctx = ordinary();
+            ctx.content = benign.into();
+            ctx.node_type = "fact".into();
+            ctx.tags = vec![];
+            let (class, _) = classify_write(&ctx, ReviewMode::RiskGated);
+            assert_eq!(
+                class,
+                RiskClass::AutoCommit,
+                "must NOT gate ordinary write: {benign}"
+            );
+        }
+    }
+
+    #[test]
+    fn sensitive_topic_word_boundary_still_catches_real_b6() {
+        // The real sensitive phrasings must still gate.
+        for risky in [
+            "store the auth token for the deploy",
+            "this is a security vulnerability in the parser",
+            "the api key for the service",
+            "remember the user preference for dark mode",
+            "the bounty payout is configured",
+        ] {
+            let mut ctx = ordinary();
+            ctx.content = risky.into();
+            ctx.node_type = "fact".into();
+            ctx.tags = vec![];
+            let (class, signals) = classify_write(&ctx, ReviewMode::RiskGated);
+            assert_eq!(class, RiskClass::Review, "must gate: {risky}");
+            assert!(signals.iter().any(|s| s.code == "sensitive_topic"));
+        }
+    }
+
    #[test]
    fn sensitive_node_type_gates() {
        let mut ctx = ordinary();
@ -689,4 +787,16 @@ mod tests {
        );
        assert_eq!(MemoryPrAction::AskAgentWhy.resulting_status(), None);
    }
+
+    #[test]
+    fn only_accept_actions_release_the_memory() {
+        // B1: accepting a risky write must release it from quarantine.
+        assert!(MemoryPrAction::Promote.releases_memory());
+        assert!(MemoryPrAction::Merge.releases_memory());
+        assert!(MemoryPrAction::Supersede.releases_memory());
+        // Rejecting / holding keeps it suppressed.
+        assert!(!MemoryPrAction::Forget.releases_memory());
+        assert!(!MemoryPrAction::Quarantine.releases_memory());
+        assert!(!MemoryPrAction::AskAgentWhy.releases_memory());
+    }
 }
--- a/crates/vestige-mcp/src/dashboard/handlers.rs
+++ b/crates/vestige-mcp/src/dashboard/handlers.rs
@ -1990,6 +1990,8 @@ pub async fn deep_reference_query(
 #[derive(Debug, Deserialize)]
 pub struct TraceListParams {
    pub limit: Option<usize>,
+    /// Optional run filter — receipts/traces scoped to one run (B5).
+    pub run: Option<String>,
 }

 /// List recent agent runs (newest activity first) for the Black Box run picker.
@ -2083,6 +2085,18 @@ pub async fn export_trace(
        })),
        "events": events,
    });
+    // B7: sanitize the run_id before putting it in the download filename so a
+    // crafted run_id (quotes, path separators, control chars) can't break the
+    // Content-Disposition header or the filename. Falls back to "trace".
+    let safe: String = run_id
+        .chars()
+        .map(|c| if c.is_ascii_alphanumeric() || c == '_' || c == '-' { c } else { '_' })
+        .collect();
+    let safe = if safe.trim_matches('_').is_empty() {
+        "trace".to_string()
+    } else {
+        safe
+    };
    let headers = [
        (
            axum::http::header::CONTENT_TYPE,
@ -2090,7 +2104,7 @@ pub async fn export_trace(
        ),
        (
            axum::http::header::CONTENT_DISPOSITION,
-            format!("attachment; filename=\"{run_id}.vestige-trace.json\""),
+            format!("attachment; filename=\"{safe}.vestige-trace.json\""),
        ),
    ];
    Ok((headers, Json(body)))
@ -2106,10 +2120,13 @@ pub async fn list_receipts(
    Query(params): Query<TraceListParams>,
 ) -> Result<Json<Value>, StatusCode> {
    let limit = params.limit.unwrap_or(50).clamp(1, 500);
-    let receipts = state
-        .storage
-        .list_receipts(limit)
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
+    // B5: when a run is given, scope to that run's receipts so the Black Box
+    // panel shows only receipts that actually belong to the selected run.
+    let receipts = match params.run.as_deref().filter(|r| !r.is_empty()) {
+        Some(run_id) => state.storage.list_receipts_for_run(run_id, limit),
+        None => state.storage.list_receipts(limit),
+    }
+    .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
    Ok(Json(serde_json::json!({
        "total": receipts.len(),
        "receipts": receipts,
@ -2207,6 +2224,39 @@ pub async fn act_on_memory_pr(
        .decide_memory_pr(&id, action)
        .map_err(|_| StatusCode::NOT_FOUND)?;

+    // B1: an accept action (promote/merge/supersede) must RELEASE the subject
+    // memory from quarantine — gate_writes suppressed it, so deciding the PR
+    // without un-suppressing would leave it "promoted" yet still held out of
+    // retrieval. Forget/Quarantine intentionally keep it suppressed.
+    let mut released = false;
+    if action.releases_memory()
+        && let Some(subject_id) = decided.subject_id.as_deref()
+    {
+        use vestige_core::neuroscience::active_forgetting::ActiveForgettingSystem;
+        let labile_hours = ActiveForgettingSystem::new().labile_hours;
+        match state.storage.reverse_suppression(subject_id, labile_hours) {
+            Ok(node) => {
+                released = true;
+                state.emit(VestigeEvent::MemoryUnsuppressed {
+                    id: node.id.clone(),
+                    remaining_count: node.suppression_count,
+                    timestamp: Utc::now(),
+                });
+            }
+            Err(e) => {
+                // Best-effort: the PR is decided regardless, but surface the
+                // failure so a stuck-suppressed memory isn't silent.
+                tracing::warn!(
+                    "memory PR {} {}d but failed to release subject {}: {}",
+                    id,
+                    action_label(action),
+                    subject_id,
+                    e
+                );
+            }
+        }
+    }
+
    state.emit(VestigeEvent::MemoryPrDecided {
        id: decided.id.clone(),
        decision: decided
@ -2218,7 +2268,24 @@ pub async fn act_on_memory_pr(
        timestamp: Utc::now(),
    });

-    Ok(Json(serde_json::to_value(&decided).unwrap_or_default()))
+    let mut out = serde_json::to_value(&decided).unwrap_or_default();
+    if let Some(obj) = out.as_object_mut() {
+        obj.insert("subjectReleased".to_string(), serde_json::json!(released));
+    }
+    Ok(Json(out))
+}
+
+/// Short label for a Memory PR action, for log lines.
+fn action_label(action: vestige_core::MemoryPrAction) -> &'static str {
+    use vestige_core::MemoryPrAction::*;
+    match action {
+        Promote => "promote",
+        Merge => "merge",
+        Supersede => "supersede",
+        Quarantine => "quarantine",
+        Forget => "forget",
+        AskAgentWhy => "ask_agent_why",
+    }
 }

 #[derive(Debug, Deserialize)]
@ -2244,8 +2311,10 @@ pub async fn set_review_mode(
    let mode = vestige_core::ReviewMode::from_label(&body.mode);
    let path = review_mode_path(&state);
    let payload = serde_json::json!({ "mode": mode.as_str() });
-    fs::write(&path, serde_json::to_vec_pretty(&payload).unwrap_or_default())
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
+    // B7: atomic write (temp + rename) so a concurrent read can never see a
+    // partially-written / corrupt review_mode.json, reusing the same helper the
+    // Sanhedrin receipt path uses.
+    write_atomic(&path, &serde_json::to_vec_pretty(&payload).unwrap_or_default())?;
    Ok(Json(serde_json::json!({ "mode": mode.as_str() })))
 }

--- a/crates/vestige-mcp/src/dashboard/mod.rs
+++ b/crates/vestige-mcp/src/dashboard/mod.rs
@ -198,13 +198,17 @@ fn build_router_inner(state: AppState, port: u16) -> (Router, AppState) {
        // MEMORY PRs (v2.2) — risk-gated brain-change review queue
        // ============================================================
        .route("/api/memory-prs", get(handlers::list_memory_prs))
+        // Static `/mode` routes declared BEFORE the dynamic `/{id}` route (B7
+        // hygiene). axum 0.8/matchit already prioritizes static segments, but
+        // declaring them first makes the intent unambiguous and guards against
+        // a future router that doesn't.
+        .route("/api/memory-prs/mode", get(handlers::get_review_mode))
+        .route("/api/memory-prs/mode", post(handlers::set_review_mode))
        .route("/api/memory-prs/{id}", get(handlers::get_memory_pr))
        .route(
            "/api/memory-prs/{id}/{action}",
            post(handlers::act_on_memory_pr),
        )
-        .route("/api/memory-prs/mode", get(handlers::get_review_mode))
-        .route("/api/memory-prs/mode", post(handlers::set_review_mode))
        .layer(
            ServiceBuilder::new()
                .concurrency_limit(50)
--- a/crates/vestige-mcp/src/trace_recorder.rs
+++ b/crates/vestige-mcp/src/trace_recorder.rs
@ -29,10 +29,45 @@ use vestige_core::{
 };

 /// Tools that write to memory and are therefore subject to risk-gated review.
+///
+/// Includes `codebase` (its `remember_pattern` / `remember_decision` actions
+/// write durable architectural-decision memories) so those brain mutations are
+/// traced and gated like any other write (B2). Read-only actions on these tools
+/// are filtered out downstream by [`is_write_decision`].
 fn is_write_tool(tool: &str) -> bool {
    matches!(
        tool,
-        "smart_ingest" | "ingest" | "session_checkpoint" | "memory"
+        "smart_ingest" | "ingest" | "session_checkpoint" | "memory" | "codebase"
+    )
+}
+
+/// Whether a tool's `decision`/`action` label denotes an actual memory write
+/// (vs. a read like `get`/`state`). Used to keep reads out of the write trace.
+fn is_write_decision(label: &str) -> bool {
+    matches!(
+        label,
+        "create"
+            | "created"
+            | "update"
+            | "updated"
+            | "supersede"
+            | "superseded"
+            | "reinforce"
+            | "reinforced"
+            | "merge"
+            | "merged"
+            | "replace"
+            | "replaced"
+            | "add_context"
+            | "edit"
+            | "edited"
+            | "promote"
+            | "promoted"
+            | "demote"
+            | "demoted"
+            | "remember_pattern"
+            | "remember_decision"
+            | "remembered"
    )
 }

@ -529,13 +564,21 @@ fn parse_suppress_reason(s: &str) -> SuppressReason {
 fn extract_writes(result: &Value) -> Vec<(String, String)> {
    let mut out = Vec::new();
    let push = |out: &mut Vec<(String, String)>, item: &Value| {
-        let decision = item.get("decision").and_then(|v| v.as_str());
+        // B2: accept either `decision` (smart_ingest) or `action`
+        // (memory promote/demote/edit, codebase remember_*). Read-only labels
+        // (get/state/...) are filtered out so reads never trace as writes.
+        let label = item
+            .get("decision")
+            .or_else(|| item.get("action"))
+            .and_then(|v| v.as_str());
        let id = item
            .get("nodeId")
            .or_else(|| item.get("id"))
            .and_then(|v| v.as_str());
-        if let (Some(d), Some(id)) = (decision, id) {
-            out.push((id.to_string(), d.to_string()));
+        if let (Some(label), Some(id)) = (label, id)
+            && is_write_decision(label)
+        {
+            out.push((id.to_string(), label.to_string()));
        }
    };
    push(&mut out, result);
@ -766,4 +809,36 @@ mod tests {
        });
        assert_eq!(extract_writes(&batch), vec![("n2".into(), "update".into())]);
    }
+
+    #[test]
+    fn extract_writes_recognizes_action_shape_b2() {
+        // B2: memory promote/demote return `action` + `nodeId`, not `decision`.
+        let promoted = serde_json::json!({ "action": "promoted", "nodeId": "m1" });
+        assert_eq!(extract_writes(&promoted), vec![("m1".into(), "promoted".into())]);
+        let demoted = serde_json::json!({ "action": "demoted", "nodeId": "m2" });
+        assert_eq!(extract_writes(&demoted), vec![("m2".into(), "demoted".into())]);
+        // codebase remember_decision returns action + nodeId.
+        let decision = serde_json::json!({ "action": "remember_decision", "nodeId": "c1" });
+        assert_eq!(
+            extract_writes(&decision),
+            vec![("c1".into(), "remember_decision".into())]
+        );
+    }
+
+    #[test]
+    fn extract_writes_ignores_read_actions_b2() {
+        // A read (memory get / get_batch / state) carries nodeId but is NOT a write.
+        let read = serde_json::json!({ "action": "get", "nodeId": "m1" });
+        assert!(extract_writes(&read).is_empty(), "get is not a write");
+        let state = serde_json::json!({ "action": "state", "nodeId": "m2" });
+        assert!(extract_writes(&state).is_empty(), "state is not a write");
+    }
+
+    #[test]
+    fn write_tool_set_includes_codebase_b2() {
+        assert!(is_write_tool("codebase"));
+        assert!(is_write_tool("memory"));
+        assert!(!is_write_tool("search"));
+        assert!(!is_write_tool("deep_reference"));
+    }
 }