diff --git a/sdk/mkdocs.yml b/sdk/mkdocs.yml
new file mode 100644
index 00000000..e2a16363
--- /dev/null
+++ b/sdk/mkdocs.yml
@@ -0,0 +1,78 @@
+site_name: Gradata
+site_description: AI behavioral adaptation engine. Corrections graduate into rules.
+repo_url: https://github.com/gradata-systems/gradata
+repo_name: gradata-systems/gradata
+
+theme:
+  name: material
+  palette:
+    - scheme: slate
+      primary: deep purple
+      accent: amber
+      toggle:
+        icon: material/brightness-4
+        name: Light mode
+    - scheme: default
+      primary: deep purple
+      accent: amber
+      toggle:
+        icon: material/brightness-7
+        name: Dark mode
+  features:
+    - navigation.instant
+    - navigation.tracking
+    - navigation.sections
+    - navigation.expand
+    - content.code.copy
+    - content.code.annotate
+    - search.highlight
+
+nav:
+  - Home: index.md
+  - Getting Started:
+    - Installation: getting-started/install.md
+    - Quick Start: getting-started/quickstart.md
+    - Core Concepts: getting-started/concepts.md
+  - Gradata Cloud:
+    - Overview: cloud/overview.md
+    - Getting Started: cloud/quickstart.md
+    - API Reference: cloud/api.md
+    - Marketplace: cloud/marketplace.md
+  - Guides:
+    - Training a Brain: guides/training.md
+    - Custom Domains: guides/custom-domains.md
+    - MCP Integration: guides/mcp.md
+  - API Reference:
+    - Brain Class: api/brain.md
+    - CLI: api/cli.md
+  - Contributing:
+    - Architecture: architecture/overview.md
+    - Patterns: architecture/patterns.md
+    - Enhancements: architecture/enhancements.md
+    - Brain Data: architecture/brain.md
+    - Agent Adaptation: architecture/agent-graduation.md
+    - Patterns API: api/patterns.md
+    - Enhancements API: api/enhancements.md
+    - Agent Adaptation Guide: guides/agent-graduation.md
+
+plugins:
+  - search
+  - mkdocstrings:
+      handlers:
+        python:
+          paths: [src]
+          options:
+            show_source: false
+            show_root_heading: true
+            heading_level: 2
+
+markdown_extensions:
+  - admonition
+  - pymdownx.details
+  - pymdownx.superfences
+  - pymdownx.highlight:
+      anchor_linenums: true
+  - pymdownx.tabbed:
+      alternate_style: true
+  - toc:
+      permalink: true
diff --git a/src/gradata/_core.py b/src/gradata/_core.py
index 825d72ce..643d1ed9 100644
--- a/src/gradata/_core.py
+++ b/src/gradata/_core.py
@@ -377,6 +377,29 @@ def brain_correct(
     except Exception as e:
         _log.debug("Domain fire attribution failed: %s", e)
 
+    # Self-healing: detect rule failures
+    try:
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        all_lessons = brain._load_lessons()
+        failure = detect_rule_failure(
+            lessons=all_lessons,
+            correction_category=category or "UNKNOWN",
+            correction_description=desc or summary or "",
+        )
+        if failure:
+            failure["correction_event_id"] = event.get("id")
+            failure["correction_severity"] = diff.severity
+            brain.emit(
+                "RULE_FAILURE", "brain.correct:self_healing",
+                failure,
+                [f"category:{failure['failed_rule_category']}", "self_healing"],
+                session,
+            )
+            event["rule_failure_detected"] = True
+    except Exception as e:
+        _log.debug("Self-healing detection failed: %s", e)
+
     # Persist rule graph
     if hasattr(brain, '_rule_graph') and brain._rule_graph:
         with contextlib.suppress(Exception):
diff --git a/src/gradata/brain.py b/src/gradata/brain.py
index 2d882cec..db241e7c 100644
--- a/src/gradata/brain.py
+++ b/src/gradata/brain.py
@@ -336,6 +336,48 @@ def correct(self, draft: str, final: str, category: str | None = None,
                              approval_required=approval_required, dry_run=dry_run,
                              min_severity=min_severity, scope=scope)
 
+    def patch_rule(self, category: str, old_description: str, new_description: str,
+                   reason: str = "") -> dict:
+        """Rewrite a rule's description. Preserves confidence/metadata. Emits RULE_PATCHED event."""
+        from gradata._db import write_lessons_safe
+        from gradata.enhancements.self_healing import apply_patch
+        from gradata.enhancements.self_improvement import format_lessons, parse_lessons
+
+        # Only patch the brain-local lessons file — never external fallbacks
+        lessons_path = self.dir / "lessons.md"
+        if not lessons_path.is_file():
+            return {"patched": False, "error": "not_found: no brain-local lessons file"}
+
+        lessons = parse_lessons(lessons_path.read_text(encoding="utf-8"))
+        patched = apply_patch(lessons, category, old_description, new_description)
+
+        if not patched:
+            return {"patched": False, "error": f"not_found: no rule matching category={category!r}"}
+
+        write_lessons_safe(lessons_path, format_lessons(lessons))
+
+        # Re-sign the patched rule so HMAC verification stays valid
+        try:
+            from gradata.enhancements.rule_integrity import sign_and_store
+            sign_and_store(self.db_path, new_description, category, patched.confidence)
+        except ImportError:
+            pass  # unsigned mode — no-op
+
+        self.emit("RULE_PATCHED", "brain.patch_rule", {
+            "category": category,
+            "old_description": old_description[:200],
+            "new_description": new_description[:200],
+            "reason": reason,
+            "confidence_preserved": patched.confidence,
+        }, [f"category:{category}", "self_healing"])
+
+        return {
+            "patched": True,
+            "old_description": old_description,
+            "new_description": new_description,
+            "confidence_preserved": patched.confidence,
+        }
+
     def end_session(self, session_corrections: list[dict] | None = None,
                     session_type: str = "full", machine_mode: bool | None = None,
                     skip_meta_rules: bool = False) -> dict:
@@ -665,6 +707,7 @@ def review_pending(self) -> list[dict]:
             import sqlite3
 
             from gradata._db import get_connection
+
             conn = get_connection(self.db_path)
             conn.row_factory = sqlite3.Row
             rows = conn.execute(
diff --git a/src/gradata/enhancements/rule_canary.py b/src/gradata/enhancements/rule_canary.py
index b9d85358..38f7da20 100644
--- a/src/gradata/enhancements/rule_canary.py
+++ b/src/gradata/enhancements/rule_canary.py
@@ -78,6 +78,7 @@ def _get_db_path(ctx=None) -> Path:
             return p
 
     # 3. Relative traversal (SDK installed alongside brain)
+    # Expects: src/gradata/enhancements/rule_canary.py -> 5 parents -> repo/brain/
     try:
         scripts_dir = Path(__file__).resolve().parent.parent.parent.parent.parent / "brain"
         p = scripts_dir / "system.db"
@@ -148,8 +149,9 @@ def check_canary_health(rule_category: str, session: int, db_path: Path | None =
             try:
                 corr_row = conn.execute(
                     "SELECT COUNT(*) as cnt FROM events WHERE type = 'CORRECTION' "
-                    "AND data_json LIKE ? AND CAST(session AS INTEGER) >= ?",
-                    (f'%"{rule_category}"%', start_session),
+                    "AND json_extract(data_json, '$.rule_category') = ? "
+                    "AND CAST(session AS INTEGER) >= ?",
+                    (rule_category, start_session),
                 ).fetchone()
                 if corr_row:
                     correction_count = corr_row["cnt"]
diff --git a/src/gradata/enhancements/rule_integrity.py b/src/gradata/enhancements/rule_integrity.py
index d705d075..7348489a 100644
--- a/src/gradata/enhancements/rule_integrity.py
+++ b/src/gradata/enhancements/rule_integrity.py
@@ -139,6 +139,10 @@ def sign_lesson_file(lessons_path: Path) -> dict[str, str]:
     Parses lesson lines matching [STATE:CONF] CATEGORY: description
     and returns a {category: signature} map.
 
+    Note: Only the *last* rule per category is retained. This is intentional —
+    graduation produces one canonical rule per category, so duplicates indicate
+    stale entries. The returned dict is keyed by category for O(1) lookup.
+
     Args:
         lessons_path: Path to lessons.md file.
 
@@ -208,8 +212,7 @@ def verify_lesson_file(lessons_path: Path, signatures: dict[str, str]) -> list[s
 
 def _ensure_table(db_path: Path) -> None:
     """Create rule_signatures table if it doesn't exist."""
-    conn = sqlite3.connect(str(db_path))
-    try:
+    with sqlite3.connect(str(db_path)) as conn:
         conn.execute("""
             CREATE TABLE IF NOT EXISTS rule_signatures (
                 category TEXT PRIMARY KEY,
@@ -218,8 +221,6 @@ def _ensure_table(db_path: Path) -> None:
             )
         """)
         conn.commit()
-    finally:
-        conn.close()
 
 
 def store_signature(db_path: Path, category: str, signature: str) -> None:
diff --git a/src/gradata/enhancements/self_healing.py b/src/gradata/enhancements/self_healing.py
new file mode 100644
index 00000000..84060762
--- /dev/null
+++ b/src/gradata/enhancements/self_healing.py
@@ -0,0 +1,389 @@
+"""
+Self-Healing Engine — Detects rule failures, generates patches, gates them through graduation.
+
+When a RULE (confidence >= 0.80) fails to prevent a correction it covers,
+this module:
+  1. Detects the failure (detect_rule_failure)
+  2. Generates a candidate patch via deterministic heuristic (generate_patch_candidate)
+  3. Gates the candidate via retroactive test (retroactive_test)
+  4. If it passes, enters the graduation pipeline as INSTINCT
+
+Architecture: LLM-whim as diagnostician, pipeline as validator. Nothing
+touches production rules without surviving graduation.
+"""
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from gradata._types import Lesson
+
+# Only RULE state with confidence >= this threshold triggers self-healing
+DEFAULT_MIN_CONFIDENCE = 0.80
+
+
+def detect_rule_failure(
+    lessons: list[Lesson],
+    correction_category: str,
+    correction_description: str,
+    min_confidence: float = DEFAULT_MIN_CONFIDENCE,
+    memory_context: dict | None = None,
+) -> dict | None:
+    """Check if an existing RULE covers this correction category.
+
+    If a RULE with confidence >= min_confidence exists for this category,
+    it should have prevented this correction. Its failure to do so is a
+    RULE_FAILURE event.
+
+    Args:
+        lessons: All current lessons from the brain.
+        correction_category: Category of the correction (e.g. "TONE").
+        correction_description: What the correction was about.
+        min_confidence: Minimum confidence for a rule to be considered
+            (default 0.80 -- rules below this are still maturing).
+        memory_context: Optional dict of active memories/domain context
+            at the time of failure. Captured for richer diagnosis.
+
+    Returns:
+        Dict with failure details if a covering rule was found, None otherwise.
+    """
+    from gradata._types import LessonState
+
+    cat = correction_category.upper()
+    candidates = [
+        l for l in lessons
+        if l.state == LessonState.RULE
+        and l.confidence >= min_confidence
+        and l.category.upper() == cat
+    ]
+
+    if not candidates:
+        return None
+
+    # Pick the highest-confidence rule -- it's the one that should have caught this
+    failed_rule = max(candidates, key=lambda l: l.confidence)
+
+    result = {
+        "failed_rule_category": cat,
+        "failed_rule_description": failed_rule.description,
+        "failed_rule_confidence": failed_rule.confidence,
+        "failed_rule_fire_count": failed_rule.fire_count,
+        "correction_description": correction_description,
+    }
+    if memory_context:
+        result["memory_context"] = memory_context
+
+    return result
+
+
+def apply_patch(
+    lessons: list[Lesson],
+    category: str,
+    old_description: str,
+    new_description: str,
+) -> Lesson | None:
+    """Find and patch a rule's description. Returns the patched lesson or None.
+
+    Preserves: confidence, fire_count, state, date, all metadata.
+    Changes: description only.
+    """
+    cat = category.upper()
+    for lesson in lessons:
+        if (lesson.category.upper() == cat
+                and lesson.description.strip() == old_description.strip()):
+            lesson.description = new_description
+            return lesson
+    return None
+
+
+def retroactive_test(
+    original_rule_desc: str,
+    proposed_patch_desc: str,
+    correction_description: str,
+) -> dict:
+    """Gate: does the proposed patch's DELTA cover the failure?
+
+    Compares the *new content added by the patch* (the delta between
+    original and proposed) against the correction description. This tests
+    whether the qualifying language the patch introduces is relevant to
+    the failure context -- not just whether the whole rule overlaps.
+
+    No LLM calls. The failure record IS the test.
+
+    Returns:
+        {"passes": bool, "delta_score": float, "delta_text": str, "reason": str}
+    """
+    if proposed_patch_desc.strip() == original_rule_desc.strip():
+        return {
+            "passes": False,
+            "delta_score": 0.0,
+            "delta_text": "",
+            "reason": "Patch identical to original rule -- no improvement",
+        }
+
+    # Extract the delta: words in the patch that aren't in the original
+    original_words = set(original_rule_desc.lower().split())
+    patch_words = proposed_patch_desc.lower().split()
+    delta_words = [w for w in patch_words if w not in original_words]
+    delta_text = " ".join(delta_words)
+
+    if not delta_text.strip():
+        return {
+            "passes": False,
+            "delta_score": 0.0,
+            "delta_text": "",
+            "reason": "No new content in patch",
+        }
+
+    # Check if the delta is relevant to the correction
+    # Use both TF-IDF similarity and simple word-stem overlap for short texts
+    from gradata.enhancements.similarity import best_similarity
+    sim = best_similarity(delta_text, correction_description)
+
+    # Fallback: word-stem overlap (handles "emails" vs "email", short deltas)
+    delta_stems = {w[:5] for w in delta_text.lower().split() if len(w) >= 3}
+    correction_stems = {w[:5] for w in correction_description.lower().split() if len(w) >= 3}
+    stem_overlap = len(delta_stems & correction_stems) / max(len(delta_stems), 1)
+    score = max(sim, stem_overlap)
+
+    threshold = 0.20  # Lower threshold since delta is shorter text
+    passes = score >= threshold
+
+    return {
+        "passes": passes,
+        "delta_score": round(score, 3),
+        "delta_text": delta_text,
+        "reason": "Patch delta covers failure" if passes else f"Delta irrelevant ({score:.3f} < {threshold})",
+    }
+
+
+def _generate_deterministic_patch(
+    rule_description: str,
+    correction_description: str,
+) -> str:
+    """Generate a narrowed rule description without LLM.
+
+    Heuristic: append the correction context as a qualifying clause.
+    This is the deterministic fallback. LLM refinement is Phase 2.
+    """
+    correction_lower = correction_description.lower()
+    rule_lower = rule_description.lower()
+
+    # Find words in correction that aren't in the rule -- these are the context
+    rule_words = set(rule_lower.split())
+    correction_words = set(correction_lower.split())
+    new_context_words = correction_words - rule_words - {
+        "the", "a", "an", "in", "on", "at", "to", "for", "of", "is", "was",
+        "from", "with", "and", "or", "but", "not", "this", "that",
+    }
+
+    if not new_context_words:
+        return rule_description  # Can't narrow -- return unchanged
+
+    # Take top 3 most informative context words
+    context_phrase = " ".join(list(new_context_words)[:3])
+    return f"{rule_description} (especially in context: {context_phrase})"
+
+
+def review_rule_failures(
+    failure_events: list[dict],
+) -> list[dict]:
+    """Analyze RULE_FAILURE events and generate patch candidates.
+
+    Each candidate includes:
+      - category, original_description, proposed_description
+      - retroactive_test result (must pass to enter pipeline)
+
+    This is the background review fork (Hermes pattern).
+    """
+    if not failure_events:
+        return []
+
+    patches = []
+    for event in failure_events:
+        data = event.get("data", {})
+        category = data.get("failed_rule_category", "")
+        original = data.get("failed_rule_description", "")
+        correction = data.get("correction_description", "")
+
+        if not category or not original:
+            continue
+
+        proposed = _generate_deterministic_patch(original, correction)
+
+        test_result = retroactive_test(original, proposed, correction)
+
+        patches.append({
+            "category": category,
+            "original_description": original,
+            "proposed_description": proposed,
+            "correction_description": correction,
+            "retroactive_test": test_result,
+        })
+
+    return patches
+
+
+# ── Nudging ────────────────────────────────────────────────────────────
+
+NUDGE_THRESHOLD = 3  # Corrections before nudging
+
+
+def _find_centroid(descriptions: list[str]) -> str:
+    """Find the most representative description (highest avg similarity to others)."""
+    if len(descriptions) <= 1:
+        return descriptions[0] if descriptions else ""
+
+    from gradata.enhancements.similarity import best_similarity
+
+    best_desc, best_avg = descriptions[0], 0.0
+    for desc in descriptions:
+        avg_sim = sum(best_similarity(desc, other) for other in descriptions if other != desc)
+        avg_sim /= max(len(descriptions) - 1, 1)
+        if avg_sim > best_avg:
+            best_avg = avg_sim
+            best_desc = desc
+    return best_desc
+
+
+def check_nudge_threshold(
+    correction_events: list[dict],
+    lessons: list[Lesson],
+    category: str,
+    threshold: int = NUDGE_THRESHOLD,
+) -> dict:
+    """Check if a category has enough corrections without a covering rule to trigger a nudge.
+
+    When triggered (A+B strategy):
+      - Proposes an INSTINCT lesson from the centroid correction (most representative)
+      - Marks it pending_approval=True so it won't graduate without validation
+
+    Returns:
+        {"should_nudge": bool, "correction_count": int, "centroid_description": str,
+         "proposed_lesson": dict | None, ...}
+    """
+    from gradata._types import LessonState
+
+    cat = category.upper()
+
+    # Collect corrections in this category
+    cat_corrections = [
+        e for e in correction_events
+        if (e.get("data", {}).get("category", "") or "").upper() == cat
+    ]
+    count = len(cat_corrections)
+
+    # Check if a RULE already covers this category
+    existing_rule = next(
+        (l for l in lessons
+         if l.category.upper() == cat
+         and l.state == LessonState.RULE
+         and l.confidence >= DEFAULT_MIN_CONFIDENCE),
+        None,
+    )
+
+    if existing_rule:
+        return {
+            "should_nudge": False,
+            "correction_count": count,
+            "centroid_description": "",
+            "proposed_lesson": None,
+            "existing_rule": existing_rule.description[:200],
+            "reason": "Rule already exists for this category",
+        }
+
+    should_nudge = count >= threshold
+    if not should_nudge:
+        return {
+            "should_nudge": False,
+            "correction_count": count,
+            "centroid_description": "",
+            "proposed_lesson": None,
+            "category": cat,
+            "reason": f"Below threshold ({count}/{threshold})",
+        }
+
+    # Find centroid: most representative correction description
+    descriptions = [
+        e.get("data", {}).get("summary", "") or e.get("data", {}).get("description", "")
+        for e in cat_corrections
+    ]
+    descriptions = [d for d in descriptions if d]
+    centroid = _find_centroid(descriptions) if descriptions else f"Repeated {cat.lower()} corrections"
+
+    # Propose an INSTINCT lesson with pending_approval
+    from gradata.enhancements.self_improvement import INITIAL_CONFIDENCE
+    proposed = {
+        "state": "INSTINCT",
+        "confidence": INITIAL_CONFIDENCE,
+        "category": cat,
+        "description": centroid,
+        "pending_approval": True,
+    }
+
+    return {
+        "should_nudge": True,
+        "correction_count": count,
+        "centroid_description": centroid,
+        "proposed_lesson": proposed,
+        "category": cat,
+        "reason": f"{count} corrections, threshold={threshold}",
+    }
+
+
+# ── Scope Narrowing (Phase 2 prep -- capture only) ────────────────────
+
+def narrow_rule_scope(
+    rule: Lesson,
+    failure_context: dict,
+) -> dict:
+    """Add a domain exclusion to a rule based on the context where it failed.
+
+    If a rule fires correctly in "sales email" but incorrectly in "casual slack",
+    the slack domain gets excluded. This is Phase 2 prep -- captures the signal
+    now, full scoped-brains implementation later.
+
+    Args:
+        rule: The rule that failed.
+        failure_context: Dict with domain/agent_type/memory info from the failure.
+
+    Returns:
+        {"narrowed": bool, "new_scope_json": str, ...}
+    """
+    import json
+
+    domain = failure_context.get("domain", "")
+    if not domain:
+        return {"narrowed": False, "reason": "No domain in failure context"}
+
+    # Parse existing scope
+    existing_scope: dict = {}
+    if rule.scope_json:
+        try:
+            existing_scope = json.loads(rule.scope_json)
+        except (json.JSONDecodeError, TypeError):
+            existing_scope = {}
+
+    excluded = existing_scope.get("excluded_domains", [])
+    if domain in excluded:
+        return {"narrowed": False, "reason": f"Domain {domain!r} already excluded"}
+
+    excluded.append(domain)
+    existing_scope["excluded_domains"] = excluded
+
+    # Capture memory context if present (memories as scoping signal)
+    if failure_context.get("active_memories"):
+        memory_exclusions = existing_scope.get("excluded_memory_contexts", [])
+        memory_exclusions.append({
+            "memories": failure_context["active_memories"],
+            "domain": domain,
+        })
+        existing_scope["excluded_memory_contexts"] = memory_exclusions
+
+    new_scope_json = json.dumps(existing_scope)
+
+    return {
+        "narrowed": True,
+        "new_scope_json": new_scope_json,
+        "excluded_domain": domain,
+    }
diff --git a/tests/test_self_healing.py b/tests/test_self_healing.py
new file mode 100644
index 00000000..dfdea84a
--- /dev/null
+++ b/tests/test_self_healing.py
@@ -0,0 +1,493 @@
+"""Tests for the self-healing engine."""
+from __future__ import annotations
+
+import pytest
+from gradata._types import Lesson, LessonState
+
+
+class TestDetectRuleFailure:
+    """detect_rule_failure: given lessons + a correction category, find rules that should have prevented it."""
+
+    def test_detects_failure_when_rule_covers_category(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks in emails",
+            fire_count=8,
+        )
+        result = detect_rule_failure(
+            lessons=[rule],
+            correction_category="TONE",
+            correction_description="Removed exclamation marks from email draft",
+            min_confidence=0.80,
+        )
+        assert result is not None
+        assert result["failed_rule_category"] == "TONE"
+        assert result["failed_rule_description"] == rule.description
+        assert result["failed_rule_confidence"] == 0.92
+
+    def test_returns_none_when_no_rule_covers_category(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="FORMAT", description="Use bullet points in reports",
+            fire_count=5,
+        )
+        result = detect_rule_failure(
+            lessons=[rule],
+            correction_category="TONE",
+            correction_description="Fixed the tone",
+        )
+        assert result is None
+
+    def test_ignores_low_confidence_rules(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        pattern = Lesson(
+            date="2026-04-01", state=LessonState.PATTERN, confidence=0.65,
+            category="TONE", description="Watch tone in emails",
+            fire_count=4,
+        )
+        result = detect_rule_failure(
+            lessons=[pattern],
+            correction_category="TONE",
+            correction_description="Fixed tone",
+            min_confidence=0.80,
+        )
+        assert result is None
+
+    def test_ignores_killed_rules(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        killed = Lesson(
+            date="2026-04-01", state=LessonState.KILLED, confidence=0.95,
+            category="TONE", description="Old tone rule",
+            fire_count=10, kill_reason="manual_rollback",
+        )
+        result = detect_rule_failure(
+            lessons=[killed],
+            correction_category="TONE",
+            correction_description="Fixed tone",
+        )
+        assert result is None
+
+    def test_includes_memory_context_when_provided(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8,
+        )
+        memory_ctx = {"active_memories": ["user prefers formal tone"], "domain": "sales"}
+        result = detect_rule_failure(
+            lessons=[rule],
+            correction_category="TONE",
+            correction_description="Removed exclamation marks",
+            memory_context=memory_ctx,
+        )
+        assert result is not None
+        assert result["memory_context"] == memory_ctx
+
+    def test_picks_highest_confidence_rule_on_multi_match(self):
+        from gradata.enhancements.self_healing import detect_rule_failure
+
+        rule_a = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.91,
+            category="TONE", description="Be formal",
+            fire_count=6,
+        )
+        rule_b = Lesson(
+            date="2026-04-02", state=LessonState.RULE, confidence=0.95,
+            category="TONE", description="Never use slang",
+            fire_count=10,
+        )
+        result = detect_rule_failure(
+            lessons=[rule_a, rule_b],
+            correction_category="TONE",
+            correction_description="Removed slang",
+        )
+        assert result is not None
+        assert result["failed_rule_confidence"] == 0.95
+
+
+class TestBrainCorrectRuleFailure:
+    """brain.correct() emits RULE_FAILURE when a RULE should have caught the correction."""
+
+    @pytest.fixture
+    def brain_with_rule(self, tmp_path):
+        """Create a brain with a graduated RULE in TONE category."""
+        from gradata.brain import Brain
+        from gradata._types import Lesson, LessonState
+        from gradata.enhancements.self_improvement import format_lessons
+        from gradata._db import write_lessons_safe
+
+        brain = Brain.init(str(tmp_path / "test-brain"))
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks in professional emails",
+            fire_count=8,
+        )
+        lessons_path = brain._find_lessons_path(create=True)
+        write_lessons_safe(lessons_path, format_lessons([rule]))
+        return brain
+
+    def test_correction_in_ruled_category_emits_rule_failure(self, brain_with_rule):
+        result = brain_with_rule.correct(
+            draft="Great to hear from you! Let's connect!",
+            final="Great to hear from you. Let's connect.",
+            category="TONE",
+        )
+        # Check that a RULE_FAILURE event was emitted
+        events = brain_with_rule.query_events(event_type="RULE_FAILURE", limit=10)
+        assert len(events) >= 1
+        failure = events[0]
+        assert failure["data"]["failed_rule_category"] == "TONE"
+        assert failure["data"]["failed_rule_confidence"] >= 0.80
+
+    def test_correction_in_unruled_category_no_rule_failure(self, brain_with_rule):
+        result = brain_with_rule.correct(
+            draft="wrong format", final="correct format",
+            category="FORMAT",
+        )
+        events = brain_with_rule.query_events(event_type="RULE_FAILURE", limit=10)
+        assert len(events) == 0
+
+
+class TestPatchRule:
+    """brain.patch_rule() rewrites a rule's description while preserving metadata."""
+
+    @pytest.fixture
+    def brain_with_rule(self, tmp_path):
+        from gradata.brain import Brain
+        from gradata._types import Lesson, LessonState
+        from gradata.enhancements.self_improvement import format_lessons
+        from gradata._db import write_lessons_safe
+
+        brain = Brain.init(str(tmp_path / "test-brain"))
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8,
+        )
+        lessons_path = brain._find_lessons_path(create=True)
+        write_lessons_safe(lessons_path, format_lessons([rule]))
+        return brain
+
+    def test_patch_rewrites_description(self, brain_with_rule):
+        result = brain_with_rule.patch_rule(
+            category="TONE",
+            old_description="Never use exclamation marks",
+            new_description="Never use exclamation marks in professional emails (casual is OK)",
+            reason="Rule was too broad - failed on casual context",
+        )
+        assert result["patched"] is True
+        assert result["old_description"] == "Never use exclamation marks"
+        assert result["new_description"].startswith("Never use exclamation marks in professional")
+
+        # Verify the lesson was actually updated on disk
+        lessons = brain_with_rule._load_lessons()
+        tone_rules = [l for l in lessons if l.category == "TONE" and l.state.value == "RULE"]
+        assert len(tone_rules) == 1
+        assert "professional emails" in tone_rules[0].description
+
+    def test_patch_preserves_confidence_and_metadata(self, brain_with_rule):
+        result = brain_with_rule.patch_rule(
+            category="TONE",
+            old_description="Never use exclamation marks",
+            new_description="Avoid exclamation marks in formal contexts",
+            reason="Narrowing scope",
+        )
+        lessons = brain_with_rule._load_lessons()
+        tone_rules = [l for l in lessons if l.category == "TONE"]
+        assert tone_rules[0].confidence == 0.92
+        assert tone_rules[0].fire_count == 8
+
+    def test_patch_emits_rule_patched_event(self, brain_with_rule):
+        brain_with_rule.patch_rule(
+            category="TONE",
+            old_description="Never use exclamation marks",
+            new_description="Avoid exclamation marks in formal contexts",
+            reason="Too broad",
+        )
+        events = brain_with_rule.query_events(event_type="RULE_PATCHED", limit=10)
+        assert len(events) >= 1
+        assert events[0]["data"]["reason"] == "Too broad"
+
+    def test_patch_nonexistent_rule_returns_not_found(self, brain_with_rule):
+        result = brain_with_rule.patch_rule(
+            category="TONE",
+            old_description="This rule does not exist",
+            new_description="New version",
+            reason="test",
+        )
+        assert result["patched"] is False
+        assert "not_found" in result.get("error", "")
+
+
+class TestRetroactiveTest:
+    """retroactive_test: validate a proposed patch against the failure that triggered it."""
+
+    def test_patch_that_covers_failure_passes(self):
+        from gradata.enhancements.self_healing import retroactive_test
+
+        result = retroactive_test(
+            original_rule_desc="Never use exclamation marks",
+            proposed_patch_desc="Never use exclamation marks in professional emails",
+            correction_description="Removed exclamation marks from sales email draft",
+        )
+        assert result["passes"] is True
+
+    def test_patch_unrelated_to_failure_fails(self):
+        from gradata.enhancements.self_healing import retroactive_test
+
+        result = retroactive_test(
+            original_rule_desc="Use bullet points",
+            proposed_patch_desc="Use numbered lists instead of bullet points",
+            correction_description="Removed exclamation marks from email",
+        )
+        assert result["passes"] is False
+
+    def test_patch_identical_to_original_fails(self):
+        """If the patch is the same as the original, it can't help."""
+        from gradata.enhancements.self_healing import retroactive_test
+
+        result = retroactive_test(
+            original_rule_desc="Never use exclamation marks",
+            proposed_patch_desc="Never use exclamation marks",
+            correction_description="Removed exclamation marks",
+        )
+        assert result["passes"] is False
+
+    def test_delta_based_matching(self):
+        """The test should check the DELTA (new words in patch), not the whole patch."""
+        from gradata.enhancements.self_healing import retroactive_test
+
+        # The delta here is "professional emails" -- relevant to "sales email draft"
+        result = retroactive_test(
+            original_rule_desc="Never use exclamation marks",
+            proposed_patch_desc="Never use exclamation marks in professional emails",
+            correction_description="Removed exclamation marks from sales email draft",
+        )
+        assert result["passes"] is True
+        assert result.get("delta_text")  # Should expose what changed
+
+
+class TestReviewRuleFailures:
+    """review_rule_failures: analyze RULE_FAILURE events and produce patch candidates."""
+
+    def test_generates_patch_for_rule_failure(self):
+        from gradata.enhancements.self_healing import review_rule_failures
+
+        failures = [{
+            "data": {
+                "failed_rule_category": "TONE",
+                "failed_rule_description": "Never use exclamation marks",
+                "failed_rule_confidence": 0.92,
+                "correction_description": "Removed exclamation marks from casual Slack message",
+            }
+        }]
+        patches = review_rule_failures(failures)
+        assert len(patches) == 1
+        assert patches[0]["category"] == "TONE"
+        assert patches[0]["original_description"] == "Never use exclamation marks"
+        assert patches[0]["proposed_description"] != "Never use exclamation marks"
+        assert "retroactive_test" in patches[0]
+
+    def test_empty_failures_returns_empty(self):
+        from gradata.enhancements.self_healing import review_rule_failures
+
+        patches = review_rule_failures([])
+        assert patches == []
+
+    def test_filters_out_patches_failing_retroactive_test(self):
+        from gradata.enhancements.self_healing import review_rule_failures
+
+        # A failure where the correction has no new context words beyond
+        # stop words -- the heuristic can't narrow the rule so
+        # proposed == original and retroactive test rejects it
+        failures = [{
+            "data": {
+                "failed_rule_category": "TONE",
+                "failed_rule_description": "Use bullet points in reports",
+                "failed_rule_confidence": 0.90,
+                "correction_description": "Use bullet points in reports",
+            }
+        }]
+        patches = review_rule_failures(failures)
+        # The patch can't narrow (correction == rule), so it returns unchanged
+        passing = [p for p in patches if p.get("retroactive_test", {}).get("passes")]
+        assert len(passing) == 0
+
+
+class TestNudgeThreshold:
+    """check_nudge_threshold: 3+ corrections in a category with no rule -> nudge."""
+
+    def test_nudge_triggered_at_threshold(self):
+        from gradata.enhancements.self_healing import check_nudge_threshold
+
+        correction_events = [
+            {"data": {"category": "TONE", "summary": "Removed exclamation marks"}, "session": 1},
+            {"data": {"category": "TONE", "summary": "Toned down exclamation marks"}, "session": 2},
+            {"data": {"category": "TONE", "summary": "Removed exclamation marks from email"}, "session": 3},
+        ]
+        lessons = []  # No rules
+        result = check_nudge_threshold(correction_events, lessons, category="TONE")
+        assert result["should_nudge"] is True
+        assert result["correction_count"] == 3
+        assert result["centroid_description"]  # Should pick most representative
+
+    def test_no_nudge_below_threshold(self):
+        from gradata.enhancements.self_healing import check_nudge_threshold
+
+        correction_events = [
+            {"data": {"category": "TONE", "summary": "Fixed tone"}, "session": 1},
+            {"data": {"category": "TONE", "summary": "Fixed tone again"}, "session": 2},
+        ]
+        result = check_nudge_threshold(correction_events, [], category="TONE")
+        assert result["should_nudge"] is False
+
+    def test_no_nudge_when_rule_exists(self):
+        from gradata.enhancements.self_healing import check_nudge_threshold
+
+        correction_events = [
+            {"data": {"category": "TONE", "summary": "Fixed tone"}, "session": i} for i in range(5)
+        ]
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.90,
+            category="TONE", description="Watch your tone", fire_count=5,
+        )
+        result = check_nudge_threshold(correction_events, [rule], category="TONE")
+        assert result["should_nudge"] is False
+        assert "existing_rule" in result
+
+    def test_auto_creates_instinct_with_pending_approval(self):
+        """Nudge should auto-create an INSTINCT lesson from centroid, pending approval."""
+        from gradata.enhancements.self_healing import check_nudge_threshold
+
+        correction_events = [
+            {"data": {"category": "TONE", "summary": "Removed exclamation marks from email"}, "session": 1},
+            {"data": {"category": "TONE", "summary": "Toned down exclamation marks in draft"}, "session": 2},
+            {"data": {"category": "TONE", "summary": "Removed exclamation marks from sales email"}, "session": 3},
+        ]
+        result = check_nudge_threshold(correction_events, [], category="TONE")
+        assert result["should_nudge"] is True
+        assert result["proposed_lesson"] is not None
+        assert result["proposed_lesson"]["state"] == "INSTINCT"
+        assert result["proposed_lesson"]["pending_approval"] is True
+
+
+class TestNarrowRuleScope:
+    """narrow_rule_scope: when a rule fails in a specific context, add exclusion scope."""
+
+    def test_adds_domain_exclusion(self):
+        import json
+        from gradata.enhancements.self_healing import narrow_rule_scope
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8, scope_json="",
+        )
+        result = narrow_rule_scope(
+            rule,
+            failure_context={"domain": "casual_slack", "agent_type": "chat"},
+        )
+        assert result["narrowed"] is True
+        scope = json.loads(result["new_scope_json"])
+        assert "casual_slack" in scope.get("excluded_domains", [])
+
+    def test_no_narrowing_without_context(self):
+        from gradata.enhancements.self_healing import narrow_rule_scope
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8,
+        )
+        result = narrow_rule_scope(rule, failure_context={})
+        assert result["narrowed"] is False
+
+    def test_accumulates_exclusions(self):
+        import json
+        from gradata.enhancements.self_healing import narrow_rule_scope
+
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8,
+            scope_json=json.dumps({"excluded_domains": ["casual_slack"]}),
+        )
+        result = narrow_rule_scope(
+            rule,
+            failure_context={"domain": "internal_notes"},
+        )
+        scope = json.loads(result["new_scope_json"])
+        assert "casual_slack" in scope["excluded_domains"]
+        assert "internal_notes" in scope["excluded_domains"]
+
+
+class TestSelfHealingE2E:
+    """Full flow: correct -> RULE_FAILURE detected -> patch generated -> rule updated."""
+
+    @pytest.fixture
+    def brain_with_rule(self, tmp_path):
+        from gradata.brain import Brain
+        from gradata._types import Lesson, LessonState
+        from gradata.enhancements.self_improvement import format_lessons
+        from gradata._db import write_lessons_safe
+
+        brain = Brain.init(str(tmp_path / "test-brain"))
+        rule = Lesson(
+            date="2026-04-01", state=LessonState.RULE, confidence=0.92,
+            category="TONE", description="Never use exclamation marks",
+            fire_count=8,
+        )
+        lessons_path = brain._find_lessons_path(create=True)
+        write_lessons_safe(lessons_path, format_lessons([rule]))
+        return brain
+
+    def test_full_self_healing_flow(self, brain_with_rule):
+        brain = brain_with_rule
+
+        # 1. Correction triggers RULE_FAILURE
+        result = brain.correct(
+            draft="Thanks for joining! Excited to work together!",
+            final="Thanks for joining. Excited to work together.",
+            category="TONE",
+        )
+        assert result.get("rule_failure_detected") is True
+
+        # 2. Verify RULE_FAILURE event was emitted
+        failures = brain.query_events(event_type="RULE_FAILURE", limit=10)
+        assert len(failures) >= 1
+
+        # 3. Review generates a patch
+        from gradata.enhancements.self_healing import review_rule_failures
+        patches = review_rule_failures(failures)
+        assert len(patches) >= 1
+
+        # 4. Apply passing patches via brain.patch_rule()
+        for patch in patches:
+            if patch.get("retroactive_test", {}).get("passes"):
+                brain.patch_rule(
+                    category=patch["category"],
+                    old_description=patch["original_description"],
+                    new_description=patch["proposed_description"],
+                    reason="E2E self-healing test",
+                )
+
+        # 5. Verify RULE_PATCHED event
+        patched_events = brain.query_events(event_type="RULE_PATCHED", limit=10)
+        # May or may not have patches depending on deterministic heuristic
+        # But the flow should complete without errors
+
+        # 6. Verify the lesson was updated (if patched)
+        if patched_events:
+            lessons = brain._load_lessons()
+            tone_rules = [l for l in lessons if l.category == "TONE"]
+            assert len(tone_rules) >= 1
+            # Confidence may drop due to correction penalty, but should still be high
+            assert tone_rules[0].confidence >= 0.70