From b6aeb061f4e8c3966bc50d79f048a5ef90ee4184 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Wed, 20 May 2026 14:24:09 +0000
Subject: [PATCH 1/4] Wire live synapse graph into L3 retrieval ranking

L3 search ranked results via vector similarity plus a separate static
learned_patterns.json reranker; the Hebbian synapse store was written to
on every query but never consulted during retrieval, and synaptic recall
only reached the UserPromptSubmit hook (never the MCP/programmatic query
path).

Seed spreading activation from the top L3 hits and boost any other result
the synapse graph co-activates, so learned association shapes ranking for
every retrieval consumer. Behind the existing NEURALMIND_SYNAPSE_INJECT
switch and a no-op on a cold graph, so cold-start output is byte-identical.

https://claude.ai/code/session_01DRbKLVDX9PNyNdXwuNqTDp
---
 neuralmind/context_selector.py |  65 +++++++++++++++-
 neuralmind/core.py             |  20 +++++
 tests/test_context_selector.py | 135 +++++++++++++++++++++++++++++++++
 3 files changed, 218 insertions(+), 2 deletions(-)

diff --git a/neuralmind/context_selector.py b/neuralmind/context_selector.py
index b203f71..69a8101 100644
--- a/neuralmind/context_selector.py
+++ b/neuralmind/context_selector.py
@@ -18,6 +18,7 @@
 - Reduction ratio: 30-50x typical
 """
 
+import os
 from dataclasses import dataclass, field
 from pathlib import Path
 
@@ -90,6 +91,12 @@ class ContextSelector:
     # Chars per token estimate
     CHARS_PER_TOKEN = 4
 
+    # Synapse-driven recall (see _apply_synapse_boost): number of top hits used
+    # to seed spreading activation, and how strongly learned co-activation
+    # nudges a result's relevance score.
+    SYNAPSE_SEED_K = 3
+    SYNAPSE_BOOST_WEIGHT = 0.3
+
     def __init__(self, embedder, project_path: str = None, enable_reranking: bool = True):
         """
         Initialize context selector.
@@ -119,6 +126,12 @@ def __init__(self, embedder, project_path: str = None, enable_reranking: bool =
         self._reranker: SemanticReranker | None = None
         self._context_modules: list[str] = []
 
+        # Optional seed-based synapse recall, injected by NeuralMind.build().
+        # Signature: (seed_node_ids: list[str]) -> list[tuple[node_id, energy]].
+        # Left None here so a selector built without a synapse store (or on a
+        # cold graph) behaves exactly as it did before this layer existed.
+        self.synapse_recall = None
+
         # Cache for layer content
         self._l0_cache: str | None = None
         self._l1_cache: str | None = None
@@ -375,6 +388,46 @@ def get_l2_context(self, query: str, max_communities: int = 3) -> tuple[str, lis
         context = self._truncate_to_tokens("\n".join(parts), self.L2_MAX_TOKENS)
         return context, loaded_communities
 
+    def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
+        """Re-rank L3 hits using learned synapse co-activation.
+
+        Seeds spreading activation from the top hits, then boosts any other
+        result the synapse graph activates — surfacing nodes the agent keeps
+        using together even when pure vector similarity ranks them lower.
+
+        No-op (returns ``results`` unchanged) when recall isn't wired, the
+        kill switch is set, or the graph is cold — so cold-start behavior is
+        byte-identical to a build without a synapse store.
+        """
+        if not self.synapse_recall or os.environ.get("NEURALMIND_SYNAPSE_INJECT") == "0":
+            return results
+
+        seeds = [r["id"] for r in results[: self.SYNAPSE_SEED_K] if r.get("id")]
+        if not seeds:
+            return results
+
+        try:
+            energy = dict(self.synapse_recall(seeds))
+        except Exception:
+            return results
+        if not energy:
+            return results
+
+        seed_set = set(seeds)
+        boosted = False
+        for r in results:
+            nid = r.get("id")
+            if nid in seed_set or nid not in energy:
+                continue
+            boost = self.SYNAPSE_BOOST_WEIGHT * energy[nid]
+            r["score"] = r.get("score", 0.0) + boost
+            r["_synapse_boost"] = boost
+            boosted = True
+
+        if boosted:
+            results = sorted(results, key=lambda r: r.get("score", 0.0), reverse=True)
+        return results
+
     def get_l3_search(self, query: str, n: int = 4) -> tuple[str, int]:
         """
         Layer 3: Deep semantic search results.
@@ -394,18 +447,26 @@ def get_l3_search(self, query: str, n: int = 4) -> tuple[str, int]:
             if reranker.enabled:
                 results = reranker.rerank(results, context_modules=self._context_modules)
 
+        # Fold in the live synapse graph: results the agent has historically
+        # co-activated with this query's top hits get a relevance nudge, so
+        # learned association — not just vector similarity — shapes ranking.
+        results = self._apply_synapse_boost(results)
+
         parts = ["## Search Results", ""]
 
         for i, result in enumerate(results, 1):
             meta = result.get("metadata", {})
             score = result.get("score", 0)
             boost = result.get("_reranker_boost", 0.0)
+            synapse = result.get("_synapse_boost", 0.0)
 
-            # Show boost in label if applied
+            # Show boosts in label if applied
             boost_label = f" (+{boost:.2f} boost)" if boost > 0 else ""
+            synapse_label = f" (+{synapse:.2f} synapse)" if synapse > 0 else ""
 
             parts.append(
-                f"{i}. **{meta.get('label', 'unknown')}** (score: {score:.2f}{boost_label})"
+                f"{i}. **{meta.get('label', 'unknown')}** "
+                f"(score: {score:.2f}{boost_label}{synapse_label})"
             )
             parts.append(f"   Type: {meta.get('file_type', 'unknown')}")
             parts.append(f"   File: {meta.get('source_file', 'unknown')}")
diff --git a/neuralmind/core.py b/neuralmind/core.py
index 5b30862..ab65d28 100644
--- a/neuralmind/core.py
+++ b/neuralmind/core.py
@@ -203,6 +203,9 @@ def build(self, force: bool = False) -> dict:
         self.selector = ContextSelector(
             self.embedder, str(self.project_path), enable_reranking=self.enable_reranking
         )
+        # Let L3 retrieval consult the live synapse graph (seed-based spread,
+        # no extra embedder round trip — the seeds are hits already fetched).
+        self.selector.synapse_recall = self._recall_for_selection
 
         # Get final stats
         final_stats = self.embedder.get_stats()
@@ -772,6 +775,23 @@ def graph_data(self, synapse_min_weight: float = 0.05, synapse_limit: int = 2000
             },
         }
 
+    def _recall_for_selection(
+        self, seed_ids: list[str], depth: int = 2, top_k: int = 8
+    ) -> list[tuple[str, float]]:
+        """Seed-based spreading activation for the context selector.
+
+        Takes node ids the selector already fetched (so no second embedder
+        round trip) and returns their learned synapse neighbors. Empty on a
+        cold graph or when synapses are unavailable.
+        """
+        store = self.synapses
+        if store is None or not seed_ids:
+            return []
+        try:
+            return store.spread(seed_ids, depth=depth, top_k=top_k)
+        except Exception:
+            return []
+
     def synaptic_neighbors(
         self, query: str, depth: int = 2, top_k: int = 10
     ) -> list[tuple[str, float]]:
diff --git a/tests/test_context_selector.py b/tests/test_context_selector.py
index e9240f5..20b3977 100644
--- a/tests/test_context_selector.py
+++ b/tests/test_context_selector.py
@@ -723,3 +723,138 @@ def test_reranking_preserves_result_count(self, mock_embedder, temp_project):
 
         # Should respect n parameter even after reranking
         assert hits <= 3
+
+
+class TestSynapseBoost:
+    """L3 retrieval consults the live synapse graph (seed-based spread)."""
+
+    @staticmethod
+    def _four_hit_embedder(mock_embedder):
+        """Override the mock so search returns four ordered, distinct hits.
+
+        With the default SYNAPSE_SEED_K=3 the top three are spread seeds
+        (and seeds are excluded from boosting), so ``node_low`` is the only
+        result eligible for a synapse boost.
+        """
+        mock_embedder.search.return_value = [
+            {
+                "id": "node_top",
+                "document": "top hit",
+                "metadata": {"label": "top", "file_type": "function", "community": 1},
+                "distance": 0.10,
+                "score": 0.90,
+            },
+            {
+                "id": "node_mid",
+                "document": "middle hit",
+                "metadata": {"label": "mid", "file_type": "function", "community": 1},
+                "distance": 0.40,
+                "score": 0.60,
+            },
+            {
+                "id": "node_seed3",
+                "document": "third seed hit",
+                "metadata": {"label": "seed3", "file_type": "function", "community": 1},
+                "distance": 0.45,
+                "score": 0.55,
+            },
+            {
+                "id": "node_low",
+                "document": "low hit",
+                "metadata": {"label": "low", "file_type": "function", "community": 2},
+                "distance": 0.50,
+                "score": 0.50,
+            },
+        ]
+        return mock_embedder
+
+    def test_boost_promotes_associated_hit(self, mock_embedder, temp_project):
+        """A strongly co-activated lower hit is reordered above higher ones."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        # node_low (0.50) is the learned neighbor of the seeds; a 0.3 * 1.0
+        # boost lifts it to 0.80, above node_mid (0.60) and node_seed3 (0.55).
+        selector.synapse_recall = lambda seeds: [("node_low", 1.0)]
+
+        text, hits = selector.get_l3_search("query", n=4)
+
+        assert hits == 4
+        # node_low should now outrank node_mid in the rendered output.
+        assert text.index("**low**") < text.index("**mid**")
+        assert "synapse" in text
+
+    def test_seeds_are_passed_from_top_hits(self, mock_embedder, temp_project):
+        """Spread is seeded from the top SYNAPSE_SEED_K hit ids, not the tail."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        captured = {}
+
+        def recall(seeds):
+            captured["seeds"] = list(seeds)
+            return []
+
+        selector.synapse_recall = recall
+        selector.get_l3_search("query", n=4)
+
+        assert captured["seeds"] == ["node_top", "node_mid", "node_seed3"]
+
+    def test_no_recall_is_noop(self, mock_embedder, temp_project):
+        """Without a recall callable, ordering and labels are unchanged."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        # synapse_recall defaults to None.
+
+        text, _ = selector.get_l3_search("query", n=4)
+
+        assert text.index("**top**") < text.index("**mid**") < text.index("**low**")
+        assert "synapse" not in text
+
+    def test_cold_graph_is_noop(self, mock_embedder, temp_project):
+        """Empty recall (cold graph) leaves results byte-identical."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: []
+
+        text, _ = selector.get_l3_search("query", n=4)
+
+        assert text.index("**top**") < text.index("**mid**") < text.index("**low**")
+        assert "synapse" not in text
+
+    def test_kill_switch_disables_boost(self, mock_embedder, temp_project, monkeypatch):
+        """NEURALMIND_SYNAPSE_INJECT=0 turns the boost off even when wired."""
+        from neuralmind.context_selector import ContextSelector
+
+        monkeypatch.setenv("NEURALMIND_SYNAPSE_INJECT", "0")
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("node_low", 1.0)]
+
+        text, _ = selector.get_l3_search("query", n=4)
+
+        assert text.index("**top**") < text.index("**mid**") < text.index("**low**")
+        assert "synapse" not in text
+
+    def test_recall_exception_is_swallowed(self, mock_embedder, temp_project):
+        """A failing recall callable must not break retrieval."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+
+        def boom(seeds):
+            raise RuntimeError("synapse store unavailable")
+
+        selector.synapse_recall = boom
+
+        text, hits = selector.get_l3_search("query", n=4)
+
+        assert hits == 4
+        assert text.index("**top**") < text.index("**mid**") < text.index("**low**")

From 6d4a1056e07ed4517f481b0a759f30d70d885fa5 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Wed, 20 May 2026 15:18:08 +0000
Subject: [PATCH 2/4] Extend synapse recall into L2/L3 selection,
 budget-neutral
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

PR1 wired the synapse graph into L3 reranking. This extends it so learned
co-activation also surfaces context the agent missed — without spending
extra tokens:

- L3: swap the weakest vector hits for the strongest absent neighbors
  (displacement, result count fixed) instead of appending them.
- L2: a co-activated community can win a slot by outscoring a vector one,
  but cannot grow how many communities load past what vector search alone
  surfaced.

Adds GraphEmbedder.get_nodes_by_ids to fetch recalled neighbors. All
behind NEURALMIND_SYNAPSE_INJECT and a no-op on a cold graph. Fixture demo
holds at ~6x reduction warm and cold (was 4.8x with an additive draft).

https://claude.ai/code/session_01DRbKLVDX9PNyNdXwuNqTDp
---
 neuralmind/context_selector.py | 119 ++++++++++++++++++++----
 neuralmind/embedder.py         |  27 ++++++
 tests/test_context_selector.py | 161 +++++++++++++++++++++++++++++++++
 3 files changed, 289 insertions(+), 18 deletions(-)

diff --git a/neuralmind/context_selector.py b/neuralmind/context_selector.py
index 69a8101..6073c87 100644
--- a/neuralmind/context_selector.py
+++ b/neuralmind/context_selector.py
@@ -91,11 +91,15 @@ class ContextSelector:
     # Chars per token estimate
     CHARS_PER_TOKEN = 4
 
-    # Synapse-driven recall (see _apply_synapse_boost): number of top hits used
-    # to seed spreading activation, and how strongly learned co-activation
-    # nudges a result's relevance score.
+    # Synapse-driven recall (see _apply_synapse_boost / get_l2_context):
+    # number of top hits used to seed spreading activation, how strongly
+    # learned co-activation nudges relevance, the cap on neighbors pulled
+    # into L3 that vector search missed, and the minimum activation an
+    # absent neighbor needs before it's worth pulling in.
     SYNAPSE_SEED_K = 3
     SYNAPSE_BOOST_WEIGHT = 0.3
+    SYNAPSE_PULL_IN_MAX = 2
+    SYNAPSE_PULL_IN_MIN_ENERGY = 0.15
 
     def __init__(self, embedder, project_path: str = None, enable_reranking: bool = True):
         """
@@ -355,9 +359,20 @@ def get_l2_context(self, query: str, max_communities: int = 3) -> tuple[str, lis
             if comm >= 0:
                 community_scores[comm] = community_scores.get(comm, 0) + score
 
+        # Pull communities the agent has historically co-activated with these
+        # hits into contention, even when this query's vector matches alone
+        # wouldn't have surfaced them. Reinforcement records community_<id>
+        # pseudo-nodes, so spreading activation can return them directly.
+        # Budget-neutral: a co-activated community can win a slot by
+        # outscoring a vector one, but it can't grow how many we load — the
+        # cap stays at what vector search alone would have surfaced.
+        vector_community_count = len(community_scores)
+        self._boost_communities_from_synapses(search_results, community_scores)
+        community_budget = min(max_communities, vector_community_count)
+
         # Get top communities
         top_communities = sorted(community_scores.items(), key=lambda x: x[1], reverse=True)[
-            :max_communities
+            :community_budget
         ]
 
         if not top_communities:
@@ -388,32 +403,67 @@ def get_l2_context(self, query: str, max_communities: int = 3) -> tuple[str, lis
         context = self._truncate_to_tokens("\n".join(parts), self.L2_MAX_TOKENS)
         return context, loaded_communities
 
+    def _synapse_disabled(self) -> bool:
+        """True when synapse recall isn't wired or the kill switch is set."""
+        return not self.synapse_recall or os.environ.get("NEURALMIND_SYNAPSE_INJECT") == "0"
+
+    def _recall_energy(self, seeds: list[str]) -> dict[str, float]:
+        """Spread from ``seeds`` and return {node_id: activation}, or {}."""
+        if not seeds:
+            return {}
+        try:
+            return dict(self.synapse_recall(seeds))
+        except Exception:
+            return {}
+
+    def _boost_communities_from_synapses(
+        self, search_results: list[dict], community_scores: dict[int, float]
+    ) -> None:
+        """Add co-activated communities' energy into ``community_scores``.
+
+        Mutates ``community_scores`` in place. No-op when recall is disabled
+        or the graph is cold, so cold-start L2 selection is unchanged.
+        """
+        if self._synapse_disabled():
+            return
+        seeds = [r["id"] for r in search_results[: self.SYNAPSE_SEED_K] if r.get("id")]
+        for node_id, energy in self._recall_energy(seeds).items():
+            if not node_id.startswith("community_"):
+                continue
+            try:
+                comm = int(node_id[len("community_") :])
+            except ValueError:
+                continue
+            community_scores[comm] = (
+                community_scores.get(comm, 0.0) + energy * self.SYNAPSE_BOOST_WEIGHT
+            )
+
     def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
         """Re-rank L3 hits using learned synapse co-activation.
 
-        Seeds spreading activation from the top hits, then boosts any other
-        result the synapse graph activates — surfacing nodes the agent keeps
-        using together even when pure vector similarity ranks them lower.
+        Budget-neutral: never grows the result count. Seeds spreading
+        activation from the top hits, then (a) boosts and reorders results
+        the graph activates and (b) swaps the weakest vector hits for
+        strongly co-activated neighbors vector search missed — surfacing
+        nodes the agent keeps using together without spending extra tokens.
 
         No-op (returns ``results`` unchanged) when recall isn't wired, the
         kill switch is set, or the graph is cold — so cold-start behavior is
         byte-identical to a build without a synapse store.
         """
-        if not self.synapse_recall or os.environ.get("NEURALMIND_SYNAPSE_INJECT") == "0":
+        if self._synapse_disabled():
             return results
 
         seeds = [r["id"] for r in results[: self.SYNAPSE_SEED_K] if r.get("id")]
-        if not seeds:
-            return results
-
-        try:
-            energy = dict(self.synapse_recall(seeds))
-        except Exception:
-            return results
+        energy = self._recall_energy(seeds)
         if not energy:
             return results
 
         seed_set = set(seeds)
+        present = {r.get("id") for r in results}
+
+        # (a) Boost results already present that the graph co-activates,
+        #     then reorder by score. Token-neutral (same nodes).
         boosted = False
         for r in results:
             nid = r.get("id")
@@ -423,10 +473,42 @@ def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
             r["score"] = r.get("score", 0.0) + boost
             r["_synapse_boost"] = boost
             boosted = True
-
         if boosted:
             results = sorted(results, key=lambda r: r.get("score", 0.0), reverse=True)
-        return results
+
+        # (b) Swap the weakest vector hits for the strongest absent neighbors.
+        #     Displacement keeps the result count fixed, so the token budget
+        #     is unchanged — we trade the least-relevant hits, not add to them.
+        candidates = sorted(
+            (
+                (nid, e)
+                for nid, e in energy.items()
+                if nid not in present
+                and not nid.startswith("community_")
+                and e >= self.SYNAPSE_PULL_IN_MIN_ENERGY
+            ),
+            key=lambda x: x[1],
+            reverse=True,
+        )[: self.SYNAPSE_PULL_IN_MAX]
+        if not candidates:
+            return results
+
+        # Keep at least one vector hit; only displace as many as we can fetch.
+        num_swap = min(len(candidates), max(0, len(results) - 1))
+        if num_swap <= 0:
+            return results
+        energy_by_id = dict(candidates[:num_swap])
+        fetched = self.embedder.get_nodes_by_ids(list(energy_by_id))
+        if not fetched:
+            return results
+
+        kept = results[: len(results) - len(fetched)]
+        for node in fetched:
+            boost = self.SYNAPSE_BOOST_WEIGHT * energy_by_id.get(node.get("id"), 0.0)
+            node["score"] = boost
+            node["_synapse_boost"] = boost
+            node["_synapse_recalled"] = True
+        return kept + fetched
 
     def get_l3_search(self, query: str, n: int = 4) -> tuple[str, int]:
         """
@@ -463,9 +545,10 @@ def get_l3_search(self, query: str, n: int = 4) -> tuple[str, int]:
             # Show boosts in label if applied
             boost_label = f" (+{boost:.2f} boost)" if boost > 0 else ""
             synapse_label = f" (+{synapse:.2f} synapse)" if synapse > 0 else ""
+            recalled_label = " [recalled]" if result.get("_synapse_recalled") else ""
 
             parts.append(
-                f"{i}. **{meta.get('label', 'unknown')}** "
+                f"{i}. **{meta.get('label', 'unknown')}**{recalled_label} "
                 f"(score: {score:.2f}{boost_label}{synapse_label})"
             )
             parts.append(f"   Type: {meta.get('file_type', 'unknown')}")
diff --git a/neuralmind/embedder.py b/neuralmind/embedder.py
index 436802b..e4fbb53 100644
--- a/neuralmind/embedder.py
+++ b/neuralmind/embedder.py
@@ -357,6 +357,33 @@ def get_file_edges(self, source_file: str, node_ids: set[str] | None = None) ->
             )
         ]
 
+    def get_nodes_by_ids(self, node_ids: list[str]) -> list[dict]:
+        """Fetch indexed nodes by id, shaped like ``search`` results.
+
+        Used to pull synapse-recalled neighbors into L3 even when vector
+        search didn't surface them. Missing ids are skipped; ``score`` is
+        omitted (callers supply their own relevance for appended nodes).
+        """
+        if not node_ids:
+            return []
+        try:
+            fetched = self.collection.get(ids=list(node_ids), include=["documents", "metadatas"])
+        except Exception:
+            return []
+        out = []
+        ids = fetched.get("ids") or []
+        docs = fetched.get("documents") or []
+        metas = fetched.get("metadatas") or []
+        for i, node_id in enumerate(ids):
+            out.append(
+                {
+                    "id": node_id,
+                    "document": docs[i] if i < len(docs) else "",
+                    "metadata": metas[i] if i < len(metas) else {},
+                }
+            )
+        return out
+
     def get_community_summary(self, community_id: int, max_nodes: int = 20) -> dict:
         """
         Get a summary of nodes in a community for context injection.
diff --git a/tests/test_context_selector.py b/tests/test_context_selector.py
index 20b3977..696f544 100644
--- a/tests/test_context_selector.py
+++ b/tests/test_context_selector.py
@@ -858,3 +858,164 @@ def boom(seeds):
 
         assert hits == 4
         assert text.index("**top**") < text.index("**mid**") < text.index("**low**")
+
+    def test_pulls_in_absent_neighbor_budget_neutral(self, mock_embedder, temp_project):
+        """A co-activated absent node displaces the weakest hit, count fixed."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        mock_embedder.get_nodes_by_ids.return_value = [
+            {
+                "id": "node_absent",
+                "document": "recalled function",
+                "metadata": {
+                    "label": "recalled_fn",
+                    "file_type": "function",
+                    "source_file": "assoc.py",
+                },
+            }
+        ]
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("node_absent", 1.0)]
+
+        text, hits = selector.get_l3_search("query", n=4)
+
+        # Count unchanged: recalled_fn entered, the weakest hit ("low") left.
+        assert hits == 4
+        assert "recalled_fn" in text
+        assert "[recalled]" in text
+        assert "**low**" not in text
+        mock_embedder.get_nodes_by_ids.assert_called_once_with(["node_absent"])
+
+    def test_pull_in_respects_energy_threshold(self, mock_embedder, temp_project):
+        """A weakly co-activated absent node is not pulled in."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        # Below SYNAPSE_PULL_IN_MIN_ENERGY (0.15).
+        selector.synapse_recall = lambda seeds: [("node_absent", 0.05)]
+
+        text, hits = selector.get_l3_search("query", n=4)
+
+        assert hits == 4
+        assert "[recalled]" not in text
+        mock_embedder.get_nodes_by_ids.assert_not_called()
+
+    def test_pull_in_respects_max_cap(self, mock_embedder, temp_project):
+        """No more than SYNAPSE_PULL_IN_MAX neighbors are pulled in."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        captured = {}
+
+        def get_nodes_by_ids(ids):
+            captured["ids"] = list(ids)
+            return [
+                {"id": i, "document": i, "metadata": {"label": i, "file_type": "function"}}
+                for i in ids
+            ]
+
+        mock_embedder.get_nodes_by_ids.side_effect = get_nodes_by_ids
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [
+            ("absent_a", 0.9),
+            ("absent_b", 0.8),
+            ("absent_c", 0.7),
+        ]
+
+        _, hits = selector.get_l3_search("query", n=4)
+
+        # Count stays 4: two weakest hits displaced by the two highest-energy
+        # neighbors (cap), absent_c left out by SYNAPSE_PULL_IN_MAX.
+        assert hits == 4
+        assert captured["ids"] == ["absent_a", "absent_b"]
+
+    def test_community_pseudo_node_not_pulled_into_l3(self, mock_embedder, temp_project):
+        """community_<id> recall nodes feed L2, never get fetched as L3 nodes."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("community_9", 1.0)]
+
+        _, hits = selector.get_l3_search("query", n=4)
+
+        assert hits == 4
+        mock_embedder.get_nodes_by_ids.assert_not_called()
+
+
+class TestSynapseCommunityBoost:
+    """L2 community selection consults the synapse graph, budget-neutral (PR2)."""
+
+    @staticmethod
+    def _two_community_embedder(mock_embedder):
+        """Vector hits across a strong community (1) and a weak one (2)."""
+        mock_embedder.search.return_value = [
+            {
+                "id": "hit_a",
+                "document": "strong",
+                "metadata": {"label": "a", "file_type": "function", "community": 1},
+                "distance": 0.1,
+                "score": 0.90,
+            },
+            {
+                "id": "hit_b",
+                "document": "weak",
+                "metadata": {"label": "b", "file_type": "function", "community": 2},
+                "distance": 0.9,
+                "score": 0.10,
+            },
+        ]
+        return mock_embedder
+
+    def test_recalled_community_displaces_weaker(self, mock_embedder, temp_project):
+        """A co-activated community wins a slot from a weaker vector one."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._two_community_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        # community_9: score 1.0 * 0.3 = 0.30 > community 2's 0.10.
+        selector.synapse_recall = lambda seeds: [("community_9", 1.0)]
+
+        _, communities = selector.get_l2_context("query")
+
+        # Count unchanged (2): 9 entered, the weaker community 2 dropped out.
+        assert len(communities) == 2
+        assert 9 in communities
+        assert 2 not in communities
+
+    def test_recall_cannot_grow_community_count(self, mock_embedder, temp_project):
+        """When vector finds one community, recall can't add a second slot."""
+        from neuralmind.context_selector import ContextSelector
+
+        # Default mock: two hits, both community 1 -> one vector community.
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("community_9", 1.0)]
+
+        _, communities = selector.get_l2_context("query")
+
+        assert len(communities) == 1
+
+    def test_no_recall_leaves_communities_unchanged(self, mock_embedder, temp_project):
+        """Without recall, only vector-hit communities are loaded."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._two_community_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+
+        _, communities = selector.get_l2_context("query")
+
+        assert set(communities) == {1, 2}
+
+    def test_malformed_community_node_ignored(self, mock_embedder, temp_project):
+        """A non-integer community_<x> recall id is skipped, not fatal."""
+        from neuralmind.context_selector import ContextSelector
+
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("community_abc", 1.0)]
+
+        # Should not raise; community list is just the vector-hit ones.
+        _, communities = selector.get_l2_context("query")
+
+        assert isinstance(communities, list)

From 20d49767b5f44af898b428533b63b53a0bf209e5 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Wed, 20 May 2026 15:32:25 +0000
Subject: [PATCH 3/4] Add synapse recall A/B to the self-benchmark
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Phase 2 measures the learned_patterns reranker; nothing isolated the
Hebbian synapse layer's effect on retrieval quality. Add Phase 3: reinforce
realistic co-editing sessions, then measure the same query set with synapse
recall off vs on (same warm graph, only NEURALMIND_SYNAPSE_INJECT differs).

On the fixture, recall lifts top-k hit rate 72% -> 83% (+12 points) while
the reduction ratio holds at 6.1x -> 6.1x — associative recall surfaces
co-edited modules a textual search ranks lower, at no token cost.

Two regression gates: recall must never lower hit rate (catches budget-
neutral displacement dropping a relevant hit) and reduction must stay
budget-neutral.

https://claude.ai/code/session_01DRbKLVDX9PNyNdXwuNqTDp
---
 tests/benchmark/run.py             | 140 ++++++++++++++++++++++++++++-
 tests/test_benchmark_regression.py |  25 ++++++
 2 files changed, 161 insertions(+), 4 deletions(-)

diff --git a/tests/benchmark/run.py b/tests/benchmark/run.py
index bfacb33..db7dd9d 100644
--- a/tests/benchmark/run.py
+++ b/tests/benchmark/run.py
@@ -30,6 +30,7 @@
 from __future__ import annotations
 
 import json
+import os
 import shutil
 import time
 from collections.abc import Iterable
@@ -331,6 +332,80 @@ def memory_stats() -> dict:
     }
 
 
+# ----------------------------------------------------------- phase 3 (synapses)
+
+# Realistic "files edited together in one session" groups. The point is to
+# teach the synapse graph cross-cutting associations a *textual* search
+# wouldn't recover: users/crud.py and db/connection.py are hubs touched
+# alongside almost every feature, even though the words "authentication" or
+# "billing" never appear in them. A query like "how does auth work?" should,
+# once the graph is warm, surface users/crud.py via the learned edge.
+SYNAPSE_SESSIONS = [
+    ["auth/handlers.py", "auth/jwt_utils.py", "users/crud.py"],
+    ["billing/stripe_client.py", "billing/invoices.py", "users/crud.py"],
+    ["api/routes.py", "users/crud.py"],
+    ["users/crud.py", "db/connection.py"],
+    ["billing/stripe_client.py", "db/connection.py"],
+]
+SYNAPSE_SESSION_REPEATS = 8
+
+
+def seed_synapses(nm: NeuralMind) -> int:
+    """Reinforce co-editing sessions directly into the synapse store.
+
+    Uses ``activate_files`` (the same entry point the file watcher calls)
+    so we exercise the real reinforcement path, not a test shim. Returns
+    the synapse edge count after seeding.
+    """
+    for _ in range(SYNAPSE_SESSION_REPEATS):
+        for session in SYNAPSE_SESSIONS:
+            nm.activate_files(session)
+    store = nm.synapses
+    return store.stats().get("edges", 0) if store else 0
+
+
+def run_synapse_phase(
+    nm: NeuralMind,
+    queries: list[dict],
+    naive_total: int,
+    inject: bool,
+) -> PhaseResult:
+    """Measure the query set with synapse recall toggled on or off.
+
+    Reads through ``selector.get_query_context`` rather than ``nm.query``
+    so measurement doesn't reinforce the graph mid-run — the only thing
+    that differs between the two passes is NEURALMIND_SYNAPSE_INJECT.
+    """
+    prev = os.environ.get("NEURALMIND_SYNAPSE_INJECT")
+    os.environ["NEURALMIND_SYNAPSE_INJECT"] = "1" if inject else "0"
+    try:
+        result = PhaseResult(phase="synapse-on" if inject else "synapse-off")
+        enc = _enc()
+        for q in queries:
+            ctx = nm.selector.get_query_context(q["question"])
+            after_tokens = len(enc.encode(ctx.context))
+            hits = top_k_modules(ctx.context)
+            result.queries.append(
+                QueryResult(
+                    id=q["id"],
+                    question=q["question"],
+                    shape=q["shape"],
+                    naive_tokens=naive_total,
+                    neuralmind_tokens=after_tokens,
+                    reduction_ratio=naive_total / max(after_tokens, 1),
+                    expected_modules=q["expected_modules"],
+                    hit_modules=hits,
+                    top_k_hit_rate=hit_rate(q["expected_modules"], hits),
+                )
+            )
+        return result
+    finally:
+        if prev is None:
+            os.environ.pop("NEURALMIND_SYNAPSE_INJECT", None)
+        else:
+            os.environ["NEURALMIND_SYNAPSE_INJECT"] = prev
+
+
 # --------------------------------------------------------------- report writer
 
 
@@ -350,7 +425,14 @@ def _dollars_saved(naive_tokens: int, neuralmind_tokens: int, queries_per_day: i
     return per_query_savings * queries_per_day * 30
 
 
-def write_results(phase1: PhaseResult, phase2: PhaseResult, mem: dict) -> None:
+def write_results(
+    phase1: PhaseResult,
+    phase2: PhaseResult,
+    mem: dict,
+    synapse_off: PhaseResult,
+    synapse_on: PhaseResult,
+    synapse_edges: int,
+) -> None:
     """Write the JSON payload consumed by the chart script and CI."""
     payload = {
         "version": 1,
@@ -368,6 +450,16 @@ def write_results(phase1: PhaseResult, phase2: PhaseResult, mem: dict) -> None:
             "uplift_reduction_ratio": phase2.avg_reduction - phase1.avg_reduction,
             "uplift_hit_rate": phase2.avg_hit_rate - phase1.avg_hit_rate,
         },
+        "phase3_synapse": {
+            "synapse_edges": synapse_edges,
+            "off_avg_reduction_ratio": synapse_off.avg_reduction,
+            "off_avg_top_k_hit_rate": synapse_off.avg_hit_rate,
+            "on_avg_reduction_ratio": synapse_on.avg_reduction,
+            "on_avg_top_k_hit_rate": synapse_on.avg_hit_rate,
+            "uplift_hit_rate": synapse_on.avg_hit_rate - synapse_off.avg_hit_rate,
+            "reduction_delta": synapse_on.avg_reduction - synapse_off.avg_reduction,
+            "queries": [asdict(q) for q in synapse_on.queries],
+        },
         "memory": mem,
         "regression_floor": REDUCTION_FLOOR,
         "pass": phase1.avg_reduction >= REDUCTION_FLOOR,
@@ -384,7 +476,14 @@ def write_results(phase1: PhaseResult, phase2: PhaseResult, mem: dict) -> None:
     RESULTS_PATH.write_text(json.dumps(payload, indent=2))
 
 
-def write_report(phase1: PhaseResult, phase2: PhaseResult, mem: dict) -> None:
+def write_report(
+    phase1: PhaseResult,
+    phase2: PhaseResult,
+    mem: dict,
+    synapse_off: PhaseResult,
+    synapse_on: PhaseResult,
+    synapse_edges: int,
+) -> None:
     """Write the human-readable Markdown report posted as a PR comment."""
     status = "PASS" if phase1.avg_reduction >= REDUCTION_FLOOR else "FAIL"
     savings = _dollars_saved(
@@ -430,6 +529,22 @@ def write_report(phase1: PhaseResult, phase2: PhaseResult, mem: dict) -> None:
         "verify the learning mechanism persists and applies. On real production repos the lift",
         "is larger; this test only catches regressions in persistence.",
         "",
+        "### Phase 3 — Synapse recall A/B (same warm graph, recall off vs on)",
+        "",
+        f"- Synapse edges after seeding co-editing sessions: `{synapse_edges}`",
+        f"- Top-k hit rate: **{_fmt_pct(synapse_off.avg_hit_rate)}** off → "
+        f"**{_fmt_pct(synapse_on.avg_hit_rate)}** on "
+        f"(Δ {(synapse_on.avg_hit_rate - synapse_off.avg_hit_rate) * 100:+.1f} points)",
+        f"- Reduction ratio: **{synapse_off.avg_reduction:.1f}×** off → "
+        f"**{synapse_on.avg_reduction:.1f}×** on "
+        f"(Δ {synapse_on.avg_reduction - synapse_off.avg_reduction:+.2f}× — "
+        "budget-neutral by design)",
+        "",
+        "This isolates the Hebbian synapse layer from the `learned_patterns` reranker in",
+        "Phase 2. The hit-rate delta shows associative recall surfacing co-edited modules a",
+        "purely textual search ranks lower; the near-zero reduction delta confirms it does so",
+        "without spending extra tokens (recalled nodes displace the weakest hits, not add to them).",
+        "",
         "### Assumptions",
         "",
         "- Baseline: every `.py` file in `tests/fixtures/sample_project/` concatenated.",
@@ -478,8 +593,18 @@ def main() -> int:
     phase2 = run_phase(nm, queries, naive_total, phase_name="warm")
     mem = memory_stats()
 
-    write_results(phase1, phase2, mem)
-    write_report(phase1, phase2, mem)
+    # Phase 3 — synapse recall A/B. Reinforce co-editing sessions, then
+    # measure the same queries with synapse recall off vs on. Isolates the
+    # synapse layer (Phase 2's lift also includes the learned_patterns
+    # reranker), and verifies the boost is budget-neutral (reduction holds).
+    reset_memory()
+    nm = NeuralMind(str(FIXTURE_DIR))
+    synapse_edges = seed_synapses(nm)
+    synapse_off = run_synapse_phase(nm, queries, naive_total, inject=False)
+    synapse_on = run_synapse_phase(nm, queries, naive_total, inject=True)
+
+    write_results(phase1, phase2, mem, synapse_off, synapse_on, synapse_edges)
+    write_report(phase1, phase2, mem, synapse_off, synapse_on, synapse_edges)
 
     print(
         f"Phase 1: {phase1.avg_reduction:.1f}× reduction, "
@@ -491,6 +616,13 @@ def main() -> int:
         f"{phase2.avg_hit_rate * 100:.0f}% top-k hit rate "
         f"(Δ {phase2.avg_reduction - phase1.avg_reduction:+.2f}×)"
     )
+    print(
+        f"Phase 3: synapse off {synapse_off.avg_hit_rate * 100:.0f}% → "
+        f"on {synapse_on.avg_hit_rate * 100:.0f}% hit rate "
+        f"(Δ {(synapse_on.avg_hit_rate - synapse_off.avg_hit_rate) * 100:+.0f}pts), "
+        f"reduction {synapse_off.avg_reduction:.1f}× → {synapse_on.avg_reduction:.1f}×, "
+        f"{synapse_edges} edges"
+    )
     print(f"Memory: {mem['events_logged']} events, {mem['patterns_learned']} patterns")
 
     return 0 if phase1.avg_reduction >= REDUCTION_FLOOR else 1
diff --git a/tests/test_benchmark_regression.py b/tests/test_benchmark_regression.py
index c4b36bd..15cc38f 100644
--- a/tests/test_benchmark_regression.py
+++ b/tests/test_benchmark_regression.py
@@ -63,6 +63,31 @@ def test_top_k_hit_rate_above_floor(benchmark_results):
     )
 
 
+def test_synapse_recall_does_not_reduce_hit_rate(benchmark_results):
+    """Synapse recall must never make retrieval worse.
+
+    Budget-neutral displacement could in principle drop a relevant vector
+    hit for a co-activated-but-wrong one. This gate catches that: with the
+    same warm graph, recall on must surface at least as many expected
+    modules as recall off.
+    """
+    p3 = benchmark_results["phase3_synapse"]
+    assert p3["on_avg_top_k_hit_rate"] >= p3["off_avg_top_k_hit_rate"] - 1e-9, (
+        f"Synapse recall lowered hit rate: {p3['off_avg_top_k_hit_rate']:.2%} off → "
+        f"{p3['on_avg_top_k_hit_rate']:.2%} on. Displacement is dropping relevant hits."
+    )
+
+
+def test_synapse_recall_is_budget_neutral(benchmark_results):
+    """Synapse recall reshapes selection without growing the token budget."""
+    p3 = benchmark_results["phase3_synapse"]
+    assert abs(p3["reduction_delta"]) <= 0.5, (
+        f"Synapse recall moved the reduction ratio by {p3['reduction_delta']:+.2f}× "
+        f"({p3['off_avg_reduction_ratio']:.1f}× off → {p3['on_avg_reduction_ratio']:.1f}× on). "
+        "It should be budget-neutral — recalled nodes displace, not append."
+    )
+
+
 def test_every_query_has_at_least_one_module_hit(benchmark_results):
     """No single query should return zero relevant modules."""
     zero_hit = [

From eb2246605f072ab29744f8d591ec65631737ac0c Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Wed, 20 May 2026 15:47:29 +0000
Subject: [PATCH 4/4] Harden synapse boost: copy results, guard id lookup
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Address two review findings on the synapse retrieval path:

- The boost incremented score on result dicts that _fetch_search caches and
  reuses, so repeated calls compounded the boost and corrupted cached vector
  scores. Operate on shallow copies — the boost is now idempotent and leaves
  the cache clean.
- Pull-in called get_nodes_by_ids unconditionally, which only GraphEmbedder
  implements; an embedder without it would raise AttributeError mid-query.
  Guard with a capability check and degrade to boost-only.

https://claude.ai/code/session_01DRbKLVDX9PNyNdXwuNqTDp
---
 neuralmind/context_selector.py | 12 +++++++++++-
 tests/test_context_selector.py | 35 ++++++++++++++++++++++++++++++++++
 2 files changed, 46 insertions(+), 1 deletion(-)

diff --git a/neuralmind/context_selector.py b/neuralmind/context_selector.py
index 6073c87..e7a76fe 100644
--- a/neuralmind/context_selector.py
+++ b/neuralmind/context_selector.py
@@ -459,6 +459,10 @@ def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
         if not energy:
             return results
 
+        # Work on shallow copies: _fetch_search caches and reuses these dicts,
+        # so mutating score in place would compound across calls and corrupt
+        # the cached vector scores. Copies keep the boost idempotent.
+        results = [dict(r) for r in results]
         seed_set = set(seeds)
         present = {r.get("id") for r in results}
 
@@ -479,6 +483,12 @@ def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
         # (b) Swap the weakest vector hits for the strongest absent neighbors.
         #     Displacement keeps the result count fixed, so the token budget
         #     is unchanged — we trade the least-relevant hits, not add to them.
+        #     Requires the embedder to support id lookup; if it doesn't (e.g. a
+        #     backend without get_nodes_by_ids), degrade to boost-only.
+        get_nodes_by_ids = getattr(self.embedder, "get_nodes_by_ids", None)
+        if not callable(get_nodes_by_ids):
+            return results
+
         candidates = sorted(
             (
                 (nid, e)
@@ -498,7 +508,7 @@ def _apply_synapse_boost(self, results: list[dict]) -> list[dict]:
         if num_swap <= 0:
             return results
         energy_by_id = dict(candidates[:num_swap])
-        fetched = self.embedder.get_nodes_by_ids(list(energy_by_id))
+        fetched = get_nodes_by_ids(list(energy_by_id))
         if not fetched:
             return results
 
diff --git a/tests/test_context_selector.py b/tests/test_context_selector.py
index 696f544..ce2bff2 100644
--- a/tests/test_context_selector.py
+++ b/tests/test_context_selector.py
@@ -842,6 +842,41 @@ def test_kill_switch_disables_boost(self, mock_embedder, temp_project, monkeypat
         assert text.index("**top**") < text.index("**mid**") < text.index("**low**")
         assert "synapse" not in text
 
+    def test_boost_does_not_mutate_cached_results(self, mock_embedder, temp_project):
+        """Boosting must not compound or contaminate the cached vector hits."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        # node_low is present and a non-seed, so path (a) boosts it.
+        selector.synapse_recall = lambda seeds: [("node_low", 1.0)]
+
+        text_first, _ = selector.get_l3_search("query", n=4)
+        text_second, _ = selector.get_l3_search("query", n=4)
+
+        # Idempotent: a second call yields identical output (no compounding).
+        assert text_first == text_second
+        # Cached dicts keep their original vector scores, uncontaminated.
+        cached = selector._query_search_cache["query"]
+        low = next(r for r in cached if r["id"] == "node_low")
+        assert low["score"] == 0.50
+        assert "_synapse_boost" not in low
+
+    def test_pull_in_degrades_without_id_lookup(self, mock_embedder, temp_project):
+        """If the embedder lacks get_nodes_by_ids, pull-in is skipped, not fatal."""
+        from neuralmind.context_selector import ContextSelector
+
+        self._four_hit_embedder(mock_embedder)
+        mock_embedder.get_nodes_by_ids = None  # backend without id lookup
+        selector = ContextSelector(mock_embedder, str(temp_project), enable_reranking=False)
+        selector.synapse_recall = lambda seeds: [("node_absent", 1.0)]
+
+        text, hits = selector.get_l3_search("query", n=4)
+
+        # No crash, no displacement — boost-only fallback.
+        assert hits == 4
+        assert "[recalled]" not in text
+
     def test_recall_exception_is_swallowed(self, mock_embedder, temp_project):
         """A failing recall callable must not break retrieval."""
         from neuralmind.context_selector import ContextSelector