Gradata · Gradata · May 26, 2026 · coderabbitai · May 26, 2026 · coderabbitai
diff --git a/Gradata/src/gradata/hooks/adapters/_base.py b/Gradata/src/gradata/hooks/adapters/_base.py
@@ -136,6 +136,27 @@ def hook_command(brain_dir: Path) -> str:
     )
 
 
+def auto_correct_command(brain_dir: Path) -> str:
+    """Return the shell command that runs the auto_correct hook with BRAIN_DIR set."""
+    env_prefix = f"BRAIN_DIR={shlex.quote(str(brain_dir))}"
+    interpreter = shlex.quote(sys.executable)
+    return f"{env_prefix} {interpreter} -m gradata.hooks.auto_correct"
+
+
+def session_close_command(brain_dir: Path) -> str:
+    """Return the shell command that runs the session_close hook with BRAIN_DIR set."""
+    quoted_brain = shlex.quote(str(brain_dir))
+    quoted_python = shlex.quote(sys.executable)
+    return f"BRAIN_DIR={quoted_brain} {quoted_python} -m gradata.hooks.session_close"
+
+
+def pre_compact_command(brain_dir: Path) -> str:
+    """Return the shell command that runs the pre_compact hook with BRAIN_DIR set."""
+    parts = [f"BRAIN_DIR={shlex.quote(str(brain_dir))}", shlex.quote(sys.executable)]
+    parts.append("-m gradata.hooks.pre_compact")
+    return " ".join(parts)
+
+
 def mcp_command(brain_dir: Path) -> list[str]:
     return [sys.executable, "-m", "gradata.mcp_server", "--brain-dir", str(brain_dir)]
 

diff --git a/Gradata/src/gradata/hooks/adapters/claude_code.py b/Gradata/src/gradata/hooks/adapters/claude_code.py
@@ -12,6 +12,7 @@
     failure,
     hook_command,
     hook_signature,
+    pre_compact_command,
     read_json,
     write_json,
 )
@@ -58,24 +59,41 @@ def install(brain_dir: Path, agent_config_path: Path) -> InstallResult:
         data = read_json(agent_config_path)
         hooks = data.setdefault("hooks", {})
         pre_tool = hooks.setdefault("PreToolUse", [])
-        if any(sig in str(item) for item in pre_tool):
+        pre_compact = hooks.setdefault("PreCompact", [])
+        has_pre_tool = any(sig in str(item) for item in pre_tool)
+        has_pre_compact = any(sig in str(item) for item in pre_compact)
+        if has_pre_tool and has_pre_compact:
             return InstallResult(
                 AGENT, agent_config_path, "already_present", "hook already present"
             )
-        pre_tool.append(
-            {
-                "matcher": "*",
-                "hooks": [
-                    {
-                        "type": "command",
-                        "command": hook_command(brain_dir),
-                        "id": sig,
-                    }
-                ],
-            }
-        )
+        if not has_pre_tool:
+            pre_tool.append(
+                {
+                    "matcher": "*",
+                    "hooks": [
+                        {
+                            "type": "command",
+                            "command": hook_command(brain_dir),
+                            "id": sig,
+                        }
+                    ],
+                }
+            )
+        if not has_pre_compact:
+            pre_compact.append(
+                {
+                    "matcher": "manual|auto",
+                    "hooks": [
+                        {
+                            "type": "command",
+                            "command": pre_compact_command(brain_dir),
+                            "id": sig,
+                        }
+                    ],
+                }
+            )
         write_json(agent_config_path, data)
-        return InstallResult(AGENT, agent_config_path, "added", "installed PreToolUse hook")
+        return InstallResult(AGENT, agent_config_path, "added", "installed Claude Code hooks")
     except Exception as exc:
         return failure(AGENT, agent_config_path, exc)
 
@@ -98,27 +116,26 @@ def uninstall(brain_dir: Path, agent_config_path: Path) -> InstallResult:
         hooks = data.get("hooks")
         if not isinstance(hooks, dict):
             return InstallResult(AGENT, agent_config_path, "already_present", "no hooks block")
-        pre_tool = hooks.get("PreToolUse")
-        if not isinstance(pre_tool, list):
-            return InstallResult(AGENT, agent_config_path, "already_present", "no PreToolUse")
-
         removed = 0
-        kept: list = []
-        for entry in pre_tool:
-            entry_str = str(entry)
-            if sig in entry_str:
-                # Either the entry's `hooks[].id` carries our sig, or the
-                # whole entry was ours. Drop it.
-                removed += 1
+        for lifecycle in ("PreToolUse", "PreCompact"):
+            entries = hooks.get(lifecycle)
+            if not isinstance(entries, list):
                 continue
-            kept.append(entry)
+            kept: list = []
+            for entry in entries:
+                entry_str = str(entry)
+                if sig in entry_str:
+                    # Either the entry's `hooks[].id` carries our sig, or the
+                    # whole entry was ours. Drop it.
+                    removed += 1
+                    continue
+                kept.append(entry)
+            if kept:
+                hooks[lifecycle] = kept
+            else:
+                hooks.pop(lifecycle, None)
         if removed == 0:
             return InstallResult(AGENT, agent_config_path, "already_present", "hook not present")
-
-        if kept:
-            hooks["PreToolUse"] = kept
-        else:
-            hooks.pop("PreToolUse", None)
         if not hooks:
             data.pop("hooks", None)
         write_json(agent_config_path, data)

diff --git a/Gradata/src/gradata/hooks/pre_compact.py b/Gradata/src/gradata/hooks/pre_compact.py
@@ -1,68 +1,125 @@
-"""PreCompact hook: save brain state snapshot before context compaction."""
+"""Claude Code PreCompact hook: snapshot bounded Gradata context before compaction."""
 
 from __future__ import annotations
 
 import hashlib
 import json
-import os
-import tempfile
-from datetime import UTC, datetime
+import re
+import time
 from pathlib import Path
+from typing import Any
 
+from gradata._atomic import atomic_write_text
 from gradata.hooks._base import resolve_brain_dir, run_hook
 from gradata.hooks._profiles import Profile
 
 HOOK_META = {
     "event": "PreCompact",
     "matcher": "manual|auto",
-    "profile": Profile.STANDARD,
+    "profile": Profile.MINIMAL,
     "timeout": 5000,
 }
+_MAX_TEXT_BYTES = 64_000  # default byte cap for files read via _read_bounded
+_MAX_JSON_BYTES = 128_000  # byte cap used when reading .last_injection.json
 
 
-def main(data: dict) -> dict | None:
+def _safe_filename(value: object) -> str:
+    """Reduce *value* to a filename-safe token of at most 120 characters."""
+    text = str(value or "").strip() or f"precompact-{int(time.time() * 1000)}"
+    cleaned = re.sub(r"[^A-Za-z0-9_.-]+", "-", text).strip(".-")
+    if cleaned:
+        return cleaned[:120]
+    # Nothing survived sanitising: fall back to a short digest of the raw text.
+    return hashlib.sha256(text.encode("utf-8", errors="replace")).hexdigest()[:16]
+
+
+def _session_id(data: dict[str, Any]) -> str:
+    """Return the first non-blank id string in *data*, else a 16-hex payload digest."""
+    for name in ("session_id", "sessionId", "conversation_id", "conversationId"):
+        if isinstance(found := data.get(name), str) and (trimmed := found.strip()):
+            return trimmed
+    payload = json.dumps(data, sort_keys=True, default=str).encode("utf-8", errors="replace")
+    return hashlib.sha256(payload).hexdigest()[:16]
+
+
+def _read_bounded(path: Path, *, limit: int = _MAX_TEXT_BYTES) -> str | None:
     try:
-        brain_dir_str = resolve_brain_dir()
-        if not brain_dir_str:
+        if not path.is_file():
             return None
-        brain_dir = Path(brain_dir_str)
-
-        compact_type = data.get("type", "unknown") if data else "unknown"
-
-        snapshot = {
-            "timestamp": datetime.now(UTC).isoformat(),
-            "compact_type": compact_type,
-            "brain_dir": str(brain_dir),
-        }
-
-        # Include lesson count if available
-        lessons_path = brain_dir / "lessons.md"
-        if lessons_path.is_file():
-            text = lessons_path.read_text(encoding="utf-8")
-            snapshot["lesson_count"] = len(
-                [
-                    line
-                    for line in text.splitlines()
-                    if (stripped := line.strip()) and not stripped.startswith("#")
-                ]
-            )
-
-        if hasattr(os, "getuid"):
-            uid = os.getuid()
-        else:
-            try:
-                uid = os.getlogin()
-            except OSError:
-                uid = f"pid{os.getpid()}"
-        user_tmp = Path(tempfile.gettempdir()) / f"gradata-{uid}"
-        user_tmp.mkdir(parents=True, exist_ok=True)
-        dir_hash = hashlib.md5(str(brain_dir).encode()).hexdigest()[:8]
-        snapshot_path = user_tmp / f"compact-snapshot-{dir_hash}.json"
-        snapshot_path.write_text(json.dumps(snapshot, indent=2), encoding="utf-8")
-
-        return {"result": "State saved before compaction"}
-    except Exception:
+        with path.open("rb") as handle:  # read at most `limit` bytes, not the whole file
+            return handle.read(limit).decode("utf-8", errors="replace")
+    except OSError:
+        return None
+
+
+def _snapshot_path(brain_dir: Path, session_id: str) -> Path:
+    return brain_dir.joinpath(".precompact-snapshots", _safe_filename(session_id) + ".json")
+
+
+def _compact_payload(data: dict[str, Any]) -> dict[str, Any]:
+    """Return the allow-listed subset of the hook payload.
+
+    Only the keys named below are copied, and only when present in *data*;
+    everything else is dropped. Key order follows the allow-list.
+
+    Returns:
+        A new dict; *data* itself is not modified.
+    """
+    allowed = ("hook_event_name", "session_id", "sessionId", "transcript_path")
+    allowed += ("cwd", "trigger", "custom_instructions", "model")
+    return {name: data[name] for name in allowed if name in data}
+
+
+def _build_snapshot(brain_dir: Path, data: dict[str, Any]) -> dict[str, Any]:
+    """Assemble the snapshot dict from the hook payload and size-capped brain files."""
+    context: dict[str, Any] = {}
+    prompt_text = _read_bounded(brain_dir / "brain_prompt.md")
+    if prompt_text is not None:
+        context["brain_prompt_md"] = prompt_text
+
+    injection_text = _read_bounded(brain_dir / ".last_injection.json", limit=_MAX_JSON_BYTES)
+    if injection_text is not None:
+        try:
+            context["last_injection"] = json.loads(injection_text)
+        except json.JSONDecodeError:  # keep unparseable content as raw text instead
+            context["last_injection_raw"] = injection_text
+
+    limits = {
+        "max_text_bytes": _MAX_TEXT_BYTES,
+        "max_json_bytes": _MAX_JSON_BYTES,
+        "transcript_content_captured": False,
+    }
+    return {
+        "schema_version": 1,
+        "created_at": time.time(),
+        "event": "PreCompact",
+        "session_id": _session_id(data),
+        "trigger": data.get("trigger"),
+        "cwd": data.get("cwd"),
+        "transcript_path": data.get("transcript_path"),
+        "custom_instructions": data.get("custom_instructions"),
+        "brain_dir": str(brain_dir),
+        "payload": _compact_payload(data),
+        "relevant_context": context,
+        "limits": limits,
+    }
+
+
+def _write_snapshot(path: Path, snapshot: dict[str, Any]) -> None:
+    path.parent.mkdir(parents=True, exist_ok=True)  # create missing parent directories
+    atomic_write_text(path, f"{json.dumps(snapshot, indent=2, sort_keys=True)}\n")
+
+
+def main(data: dict[str, Any]) -> None:
+    """Snapshot bounded Gradata context for *data* into the resolved brain directory."""
+    resolved = resolve_brain_dir()
+    brain_dir = Path(resolved) if resolved else None
+    # Require a real directory: a plain file here would make the snapshot mkdir fail.
+    if brain_dir is None or not brain_dir.is_dir():
         return None
+    session_id = _session_id(data)
+    _write_snapshot(_snapshot_path(brain_dir, session_id), _build_snapshot(brain_dir, data))
+    return None
 
 
 if __name__ == "__main__":

diff --git a/Gradata/tests/test_hook_adapters.py b/Gradata/tests/test_hook_adapters.py
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+import json
 import os
 import tomllib
 from pathlib import Path
@@ -63,3 +64,26 @@ def test_adapter_install_does_not_touch_real_user_config(tmp_path: Path) -> None
     assert result.action == "added"
     after = real_config.read_text(encoding="utf-8") if real_config.exists() else None
     assert after == before
+
+
+def test_claude_code_install_writes_pre_compact_entry(tmp_path: Path) -> None:
+    """Installing twice yields exactly one PreCompact entry that runs pre_compact."""
+    brain_dir = tmp_path / "brain"
+    brain_dir.mkdir()
+    config_path = tmp_path / ".claude" / "settings.json"
+
+    adapter = get_adapter("claude-code")
+    first = adapter.install(brain_dir, config_path)
+    second = adapter.install(brain_dir, config_path)
+
+    assert first.action == "added"
+    assert second.action == "already_present"
+    settings = json.loads(config_path.read_text(encoding="utf-8"))
+    pre_compact = settings["hooks"]["PreCompact"]
+    commands = [h.get("command", "") for entry in pre_compact for h in entry.get("hooks", [])]
+    assert len(pre_compact) == 1
+    # Both markers must be in the same command, not spread over different ones.
+    assert any(
+        "BRAIN_DIR=" in command and "gradata.hooks.pre_compact" in command
+        for command in commands
+    )