memory-search: chunk context output for hook delivery

Claude Code's hook output limit (~10K chars) was truncating the full
context load. Split output into chunks at section boundaries, deliver
first chunk on UserPromptSubmit, save remaining chunks to disk for
drip-feeding on subsequent PostToolUse calls.

Two-pass algorithm: split at "--- KEY (group) ---" boundaries, then
merge adjacent small sections up to 9K per chunk. Separates session_id
guard (needed for chunk state) from prompt guard (needed only for
search), so PostToolUse events without a prompt can still pop chunks.
This commit is contained in:
ProofOfConcept 2026-03-09 17:56:59 -04:00
parent 32d17997af
commit d5554db6a8

View file

@ -45,6 +45,8 @@ struct Args {
} }
const STASH_PATH: &str = "/tmp/claude-memory-search/last-input.json"; const STASH_PATH: &str = "/tmp/claude-memory-search/last-input.json";
/// Max bytes per context chunk (hook output limit is ~10K chars)
const CHUNK_SIZE: usize = 9000;
fn main() { fn main() {
// Daemon agent calls set POC_AGENT=1 — skip memory search. // Daemon agent calls set POC_AGENT=1 — skip memory search.
@ -84,7 +86,7 @@ fn main() {
let prompt = json["prompt"].as_str().unwrap_or(""); let prompt = json["prompt"].as_str().unwrap_or("");
let session_id = json["session_id"].as_str().unwrap_or(""); let session_id = json["session_id"].as_str().unwrap_or("");
if prompt.is_empty() || session_id.is_empty() { if session_id.is_empty() {
return; return;
} }
@ -123,12 +125,12 @@ fn main() {
if debug { println!("[memory-search] loading full context"); } if debug { println!("[memory-search] loading full context"); }
// Load full memory context and pre-populate seen set with injected keys // Load full memory context, chunk it, print first chunk, save rest
if let Ok(output) = Command::new("poc-memory").args(["load-context"]).output() { if let Ok(output) = Command::new("poc-memory").args(["load-context"]).output() {
if output.status.success() { if output.status.success() {
let ctx = String::from_utf8_lossy(&output.stdout); let ctx = String::from_utf8_lossy(&output.stdout).to_string();
if !ctx.trim().is_empty() { if !ctx.trim().is_empty() {
// Extract keys from "--- KEY (group) ---" lines // Extract keys from all chunks for seen set
for line in ctx.lines() { for line in ctx.lines() {
if line.starts_with("--- ") && line.ends_with(" ---") { if line.starts_with("--- ") && line.ends_with(" ---") {
let inner = &line[4..line.len() - 4]; let inner = &line[4..line.len() - 4];
@ -138,15 +140,42 @@ fn main() {
} }
} }
} }
if debug { println!("[memory-search] context loaded: {} bytes", ctx.len()); }
if args.hook { let chunks = chunk_context(&ctx, CHUNK_SIZE);
print!("{}", ctx); if debug {
println!("[memory-search] context: {} bytes, {} chunks",
ctx.len(), chunks.len());
} }
// Print first chunk
if let Some(first) = chunks.first() {
if args.hook {
print!("{}", first);
}
}
// Save remaining chunks for drip-feeding
save_pending_chunks(&state_dir, session_id, &chunks[1..]);
} }
} }
} }
let _ = cookie; let _ = cookie;
} else {
// Not first call: drip-feed next pending chunk
if let Some(chunk) = pop_pending_chunk(&state_dir, session_id) {
if debug {
println!("[memory-search] drip-feeding pending chunk: {} bytes", chunk.len());
}
if args.hook {
print!("{}", chunk);
}
}
}
// Search requires a prompt (PostToolUse events don't have one)
if prompt.is_empty() {
return;
} }
// Skip system/AFK prompts // Skip system/AFK prompts
@ -288,6 +317,82 @@ fn main() {
} }
/// Split context output into chunks of approximately `max_bytes`, breaking
/// at section boundaries ("--- KEY (group) ---" lines).
fn chunk_context(ctx: &str, max_bytes: usize) -> Vec<String> {
    let is_header = |l: &str| l.starts_with("--- ") && l.ends_with(" ---");

    // Pass 1: carve the context into sections, one per group header.
    // Any preamble before the first header becomes the leading section.
    let mut sections: Vec<String> = vec![String::new()];
    for line in ctx.lines() {
        if is_header(line) && !sections.last().unwrap().is_empty() {
            sections.push(String::new());
        }
        let cur = sections.last_mut().unwrap();
        if !cur.is_empty() {
            cur.push('\n');
        }
        cur.push_str(line);
    }
    // An empty (or blank-line-only) context leaves the seed section empty.
    sections.retain(|s| !s.is_empty());

    // Pass 2: greedily pack adjacent sections into chunks of at most
    // `max_bytes` (a single oversized section still becomes one chunk).
    let mut chunks: Vec<String> = Vec::new();
    for section in sections {
        match chunks.last_mut() {
            // +1 accounts for the joining newline.
            Some(last) if last.len() + section.len() + 1 <= max_bytes => {
                last.push('\n');
                last.push_str(&section);
            }
            _ => chunks.push(section),
        }
    }
    chunks
}
/// Save remaining chunks to disk for drip-feeding on subsequent hook calls.
fn save_pending_chunks(dir: &Path, session_id: &str, chunks: &[String]) {
    let chunks_dir = dir.join(format!("chunks-{}", session_id));
    // Always start from a clean slate: stale chunks from a previous
    // context load must not leak into this session's drip feed.
    let _ = fs::remove_dir_all(&chunks_dir);
    if chunks.is_empty() {
        return;
    }
    // Best-effort writes: a failed save just means fewer drip-fed chunks.
    fs::create_dir_all(&chunks_dir).ok();
    // Zero-padded names keep lexicographic order == delivery order.
    for (index, body) in chunks.iter().enumerate() {
        let _ = fs::write(chunks_dir.join(format!("{:04}", index)), body);
    }
}
/// Pop the next pending chunk (lowest numbered file). Returns None if no chunks remain.
fn pop_pending_chunk(dir: &Path, session_id: &str) -> Option<String> {
    let chunks_dir = dir.join(format!("chunks-{}", session_id));
    if !chunks_dir.exists() {
        return None;
    }
    // save_pending_chunks writes zero-padded indices, so the
    // lexicographically smallest file name is the next chunk.
    let next = fs::read_dir(&chunks_dir)
        .ok()?
        .flatten()
        .filter(|e| e.file_type().map(|t| t.is_file()).unwrap_or(false))
        .min_by_key(|e| e.file_name())?;
    let body = fs::read_to_string(next.path()).ok()?;
    let _ = fs::remove_file(next.path());
    // Remove the directory once the last chunk has been consumed.
    let now_empty = fs::read_dir(&chunks_dir)
        .ok()
        .map(|mut d| d.next().is_none())
        .unwrap_or(true);
    if now_empty {
        let _ = fs::remove_dir(&chunks_dir);
    }
    Some(body)
}
/// Reverse-scan the transcript JSONL, extracting text from user/assistant /// Reverse-scan the transcript JSONL, extracting text from user/assistant
/// messages until we accumulate `max_tokens` tokens of text content. /// messages until we accumulate `max_tokens` tokens of text content.
/// Then search for all node keys as substrings, weighted by position. /// Then search for all node keys as substrings, weighted by position.