consciousness/src/thought/context.rs

// context.rs — Context window management
//
// Token counting, conversation trimming, and error classification.
// Journal entries are loaded from the memory graph store, not from
// a flat file — the parse functions are gone.

use crate::agent::types::*;
use chrono::{DateTime, Utc};
use tiktoken_rs::CoreBPE;

/// One journal entry: a UTC timestamp paired with the entry's text.
#[derive(Clone, Debug)]
pub struct JournalEntry {
    /// Timestamp associated with the entry, in UTC.
    pub timestamp: DateTime<Utc>,
    /// Text body of the entry.
    pub content: String,
}

/// Return the context window size, in tokens.
///
/// The value is read from the crate configuration's `api_context_window`
/// setting; the `_model` argument is accepted but not consulted.
pub fn model_context_window(_model: &str) -> usize {
    let settings = crate::config::get();
    settings.api_context_window
}

/// Token budget for assembled context: 60% of the context window reported
/// by [`model_context_window`] (integer arithmetic, rounded down).
fn context_budget_tokens(model: &str) -> usize {
    // Share of the window, in percent, that the context may occupy.
    const BUDGET_PERCENT: usize = 60;

    let window = model_context_window(model);
    window * BUDGET_PERCENT / 100
}

/// Drop the oldest conversation messages until the rest fits the budget.
///
/// The space available to the conversation is the context budget minus the
/// token cost of the system prompt, the personality entries, the journal
/// entries, and a reserve of one quarter of the budget (saturating at zero).
/// Messages are removed from the front until the remaining total fits, and
/// the cut is then advanced to the next `Role::User` message so the result
/// always begins on a user turn.
///
/// Returns a cloned tail of `conversation`. The tail is empty when no user
/// message exists at or after the cut point — including the case where
/// nothing needed trimming but the conversation contains no user message.
pub fn trim_conversation(
    context: &ContextState,
    conversation: &[Message],
    model: &str,
    tokenizer: &CoreBPE,
) -> Vec<Message> {
    let tokens_in = |text: &str| tokenizer.encode_with_special_tokens(text).len();
    let budget = context_budget_tokens(model);

    // Fixed overhead that is always sent alongside the conversation.
    let personality_cost: usize = context
        .personality
        .iter()
        .map(|(_, text)| tokens_in(text))
        .sum();
    let prompt_cost = tokens_in(&context.system_prompt) + personality_cost;
    let journal_cost: usize = context
        .journal
        .iter()
        .map(|entry| tokens_in(&entry.content))
        .sum();

    // A quarter of the budget is held back as a reserve.
    let headroom = budget / 4;
    let available = budget
        .saturating_sub(headroom)
        .saturating_sub(prompt_cost)
        .saturating_sub(journal_cost);

    let per_message: Vec<usize> = conversation
        .iter()
        .map(|message| msg_token_count(tokenizer, message))
        .collect();

    // Discard from the oldest end until what is left fits.
    let mut remaining: usize = per_message.iter().sum();
    let mut cut = 0;
    for cost in &per_message {
        if remaining <= available {
            break;
        }
        remaining -= cost;
        cut += 1;
    }

    // Advance the cut to the first user message at or after it; if there is
    // none, everything is dropped.
    let start = conversation[cut..]
        .iter()
        .position(|message| message.role == Role::User)
        .map_or(conversation.len(), |offset| cut + offset);

    conversation[start..].to_vec()
}

/// Compute how many tokens a message occupies under the given BPE tokenizer.
///
/// The total is the sum of:
/// - the message content: plain text is tokenized directly; multi-part
///   content sums its text parts, with each image part counted as a flat
///   85 tokens; absent content counts as zero;
/// - every tool call's function name and argument string.
pub fn msg_token_count(tokenizer: &CoreBPE, msg: &Message) -> usize {
    // Flat cost charged for each image part instead of tokenizing it.
    const IMAGE_PART_TOKENS: usize = 85;

    let tokens_in = |text: &str| tokenizer.encode_with_special_tokens(text).len();

    let body_tokens: usize = match msg.content.as_ref() {
        None => 0,
        Some(MessageContent::Text(text)) => tokens_in(text),
        Some(MessageContent::Parts(parts)) => {
            let mut subtotal = 0;
            for part in parts.iter() {
                subtotal += match part {
                    ContentPart::Text { text } => tokens_in(text),
                    ContentPart::ImageUrl { .. } => IMAGE_PART_TOKENS,
                };
            }
            subtotal
        }
    };

    let call_tokens: usize = match msg.tool_calls.as_ref() {
        None => 0,
        Some(calls) => calls
            .iter()
            .map(|call| tokens_in(&call.function.name) + tokens_in(&call.function.arguments))
            .sum(),
    };

    body_tokens + call_tokens
}

/// Report whether an API error looks like a context-window overflow.
///
/// The error's display text is lowercased and checked against a list of
/// known phrases; as a fallback, any message containing both "400" and
/// "tokens" is also treated as an overflow.
pub fn is_context_overflow(err: &anyhow::Error) -> bool {
    // Substrings (already lowercase) that mark an overflow on their own.
    const OVERFLOW_PHRASES: [&str; 8] = [
        "context length",
        "token limit",
        "too many tokens",
        "maximum context",
        "prompt is too long",
        "request too large",
        "input validation error",
        "content length limit",
    ];

    let lowered = err.to_string().to_lowercase();
    if OVERFLOW_PHRASES
        .iter()
        .any(|phrase| lowered.contains(*phrase))
    {
        return true;
    }

    // Fallback: a message mentioning both "400" and "tokens".
    lowered.contains("400") && lowered.contains("tokens")
}

/// Report whether an error is a model/provider failure that arrived inside
/// the SSE stream.
///
/// This is a case-sensitive check for the marker text "model stream error"
/// in the error's display output.
pub fn is_stream_error(err: &anyhow::Error) -> bool {
    let rendered = err.to_string();
    rendered.contains("model stream error")
}
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`// context.rs — Context window management`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`//`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`// Token counting, conversation trimming, and error classification.`
			`// Journal entries are loaded from the memory graph store, not from`
			`// a flat file — the parse functions are gone.`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00
			`use crate::agent::types::*;`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`use chrono::{DateTime, Utc};`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`use tiktoken_rs::CoreBPE;`
move journal types from agent/journal.rs to thought/context.rs JournalEntry, parse_journal, parse_journal_text, parse_header_timestamp, and default_journal_path consolidated into thought/context.rs. Delete the duplicate agent/journal.rs (235 lines). Update all references. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:25:07 -04:00
			`/// A single journal entry with its timestamp and content.`
			`#[derive(Debug, Clone)]`
			`pub struct JournalEntry {`
			`pub timestamp: DateTime<Utc>,`
			`pub content: String,`
			`}`

thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`/// Look up a model's context window size in tokens.`
cleanup: remove model name string matching model_context_window() now reads from config.api_context_window instead of guessing from model name strings. is_anthropic_model() replaced with backend == "anthropic" checks. Dead model field removed from AgentDef/AgentHeader. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 14:09:54 -04:00			`pub fn model_context_window(_model: &str) -> usize {`
			`crate::config::get().api_context_window`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`}`

			`/// Context budget in tokens: 60% of the model's context window.`
			`fn context_budget_tokens(model: &str) -> usize {`
			`model_context_window(model) * 60 / 100`
			`}`

delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`/// Trim conversation to fit within the context budget.`
			`/// Returns the trimmed conversation messages (oldest dropped first).`
			`pub fn trim_conversation(`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`context: &ContextState,`
			`conversation: &[Message],`
			`model: &str,`
			`tokenizer: &CoreBPE,`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`) -> Vec<Message> {`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`let count = \|s: &str\| tokenizer.encode_with_special_tokens(s).len();`
			`let max_tokens = context_budget_tokens(model);`

delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`let identity_cost = count(&context.system_prompt)`
			`+ context.personality.iter().map(\|(_, c)\| count(c)).sum::<usize>();`
			`let journal_cost: usize = context.journal.iter().map(\|e\| count(&e.content)).sum();`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`let reserve = max_tokens / 4;`
			`let available = max_tokens`
			`.saturating_sub(identity_cost)`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`.saturating_sub(journal_cost)`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`.saturating_sub(reserve);`

delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`let msg_costs: Vec<usize> = conversation.iter()`
			`.map(\|m\| msg_token_count(tokenizer, m)).collect();`
			`let total: usize = msg_costs.iter().sum();`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`let mut skip = 0;`
			`let mut trimmed = total;`
			`while trimmed > available && skip < conversation.len() {`
			`trimmed -= msg_costs[skip];`
			`skip += 1;`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`}`

			`// Walk forward to user message boundary`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`while skip < conversation.len() && conversation[skip].role != Role::User {`
			`skip += 1;`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`}`

delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`conversation[skip..].to_vec()`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`}`

delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`/// Count the token footprint of a message using BPE tokenization.`
			`pub fn msg_token_count(tokenizer: &CoreBPE, msg: &Message) -> usize {`
			`let count = \|s: &str\| tokenizer.encode_with_special_tokens(s).len();`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`let content = msg.content.as_ref().map_or(0, \|c\| match c {`
			`MessageContent::Text(s) => count(s),`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`MessageContent::Parts(parts) => parts.iter()`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`.map(\|p\| match p {`
			`ContentPart::Text { text } => count(text),`
			`ContentPart::ImageUrl { .. } => 85,`
			`})`
			`.sum(),`
			`});`
			`let tools = msg.tool_calls.as_ref().map_or(0, \|calls\| {`
delete dead flat-file journal code from thought/context.rs Journal entries are loaded from the memory graph store, not from the flat journal file. Remove build_context_window, plan_context, render_journal_text, assemble_context, truncate_at_section, find_journal_cutoff, parse_journal*, ContextPlan, and stale TODOs. Keep JournalEntry, default_journal_path (write path), and the live context management functions. -363 lines. Co-Authored-By: Proof of Concept <poc@bcachefs.org> 2026-04-02 15:31:12 -04:00			`calls.iter()`
thought: create shared cognitive substrate module New src/thought/ module containing tools and infrastructure shared between poc-agent and subconscious agents: memory operations, file tools, bash, context window management. Currently coexists with agent/tools/ — next step is to wire up both agent/ and subconscious/ to use thought::dispatch instead of duplicating the routing logic. Move dbglog macro to lib.rs so it's available crate-wide regardless of module compilation order. 2026-03-27 15:22:48 -04:00			`.map(\|c\| count(&c.function.arguments) + count(&c.function.name))`
			`.sum()`
			`});`
			`content + tools`
			`}`

			`/// Detect context window overflow errors from the API.`
			`pub fn is_context_overflow(err: &anyhow::Error) -> bool {`
			`let msg = err.to_string().to_lowercase();`
			`msg.contains("context length")`
			`\|\| msg.contains("token limit")`
			`\|\| msg.contains("too many tokens")`
			`\|\| msg.contains("maximum context")`
			`\|\| msg.contains("prompt is too long")`
			`\|\| msg.contains("request too large")`
			`\|\| msg.contains("input validation error")`
			`\|\| msg.contains("content length limit")`
			`\|\| (msg.contains("400") && msg.contains("tokens"))`
			`}`

			`/// Detect model/provider errors delivered inside the SSE stream.`
			`pub fn is_stream_error(err: &anyhow::Error) -> bool {`
			`err.to_string().contains("model stream error")`
			`}`