unify conversation persistence to append-only jsonl
Log `ConversationEntry` (with Memory/Message typing) instead of raw `Message`. `restore_from_log` now reads typed entries directly, preserving the Memory vs. Message distinction across restarts. Remove the `current.json` snapshot and `save_session` — the append-only log is the single source of truth. Remove the dead `read_all` and `message_count` methods. Add `push_entry` for logging typed entries.

Co-Authored-By: Proof of Concept <poc@bcachefs.org>
This commit is contained in:
parent
1f7b585d41
commit
a21cf31ad2
3 changed files with 47 additions and 125 deletions
|
|
@ -14,7 +14,7 @@ use std::fs::{File, OpenOptions};
|
|||
use std::io::{BufRead, BufReader, Seek, SeekFrom, Write};
|
||||
use std::path::{Path, PathBuf};
|
||||
|
||||
use crate::agent::types::Message;
|
||||
use crate::agent::types::ConversationEntry;
|
||||
|
||||
pub struct ConversationLog {
|
||||
path: PathBuf,
|
||||
|
|
@ -30,16 +30,16 @@ impl ConversationLog {
|
|||
Ok(Self { path })
|
||||
}
|
||||
|
||||
/// Append a single message to the log.
|
||||
pub fn append(&self, msg: &Message) -> Result<()> {
|
||||
/// Append a conversation entry to the log.
|
||||
pub fn append(&self, entry: &ConversationEntry) -> Result<()> {
|
||||
let mut file = OpenOptions::new()
|
||||
.create(true)
|
||||
.append(true)
|
||||
.open(&self.path)
|
||||
.with_context(|| format!("opening log {}", self.path.display()))?;
|
||||
|
||||
let line = serde_json::to_string(msg)
|
||||
.context("serializing message for log")?;
|
||||
let line = serde_json::to_string(entry)
|
||||
.context("serializing entry for log")?;
|
||||
writeln!(file, "{}", line)
|
||||
.context("writing to conversation log")?;
|
||||
Ok(())
|
||||
|
|
@ -48,7 +48,7 @@ impl ConversationLog {
|
|||
/// Read the tail of the log (last `max_bytes` bytes).
|
||||
/// Seeks to `file_len - max_bytes`, skips the first partial line,
|
||||
/// then parses forward. For logs smaller than `max_bytes`, reads everything.
|
||||
pub fn read_tail(&self, max_bytes: u64) -> Result<Vec<Message>> {
|
||||
pub fn read_tail(&self, max_bytes: u64) -> Result<Vec<ConversationEntry>> {
|
||||
if !self.path.exists() {
|
||||
return Ok(Vec::new());
|
||||
}
|
||||
|
|
@ -64,62 +64,19 @@ impl ConversationLog {
|
|||
reader.read_line(&mut discard)?;
|
||||
}
|
||||
|
||||
let mut messages = Vec::new();
|
||||
let mut entries = Vec::new();
|
||||
for line in reader.lines() {
|
||||
let line = line.context("reading log tail")?;
|
||||
let line = line.trim();
|
||||
if line.is_empty() {
|
||||
continue;
|
||||
}
|
||||
match serde_json::from_str::<Message>(line) {
|
||||
Ok(msg) => messages.push(msg),
|
||||
Err(_) => {} // skip corrupt/partial lines
|
||||
// Try ConversationEntry first (new format), fall back to bare Message (old logs)
|
||||
if let Ok(entry) = serde_json::from_str::<ConversationEntry>(line) {
|
||||
entries.push(entry);
|
||||
}
|
||||
}
|
||||
Ok(messages)
|
||||
}
|
||||
|
||||
/// Count messages in the log without loading content.
|
||||
#[allow(dead_code)]
|
||||
pub fn message_count(&self) -> Result<usize> {
|
||||
if !self.path.exists() {
|
||||
return Ok(0);
|
||||
}
|
||||
let file = File::open(&self.path)
|
||||
.with_context(|| format!("opening log {}", self.path.display()))?;
|
||||
let reader = BufReader::new(file);
|
||||
Ok(reader.lines()
|
||||
.filter(|l| l.as_ref().map_or(false, |s| !s.trim().is_empty()))
|
||||
.count())
|
||||
}
|
||||
|
||||
/// Read all messages from the log. Returns empty vec if log doesn't exist.
|
||||
/// NOTE: Don't use this in hot paths — use read_tail() instead.
|
||||
#[allow(dead_code)]
|
||||
pub fn read_all(&self) -> Result<Vec<Message>> {
|
||||
if !self.path.exists() {
|
||||
return Ok(Vec::new());
|
||||
}
|
||||
let file = File::open(&self.path)
|
||||
.with_context(|| format!("opening log {}", self.path.display()))?;
|
||||
let reader = BufReader::new(file);
|
||||
let mut messages = Vec::new();
|
||||
|
||||
for (i, line) in reader.lines().enumerate() {
|
||||
let line = line.with_context(|| format!("reading log line {}", i))?;
|
||||
let line = line.trim();
|
||||
if line.is_empty() {
|
||||
continue;
|
||||
}
|
||||
match serde_json::from_str::<Message>(line) {
|
||||
Ok(msg) => messages.push(msg),
|
||||
Err(e) => {
|
||||
// Log corruption — skip bad lines rather than failing
|
||||
eprintln!("warning: skipping corrupt log line {}: {}", i, e);
|
||||
}
|
||||
}
|
||||
}
|
||||
Ok(messages)
|
||||
Ok(entries)
|
||||
}
|
||||
|
||||
pub fn path(&self) -> &Path {
|
||||
|
|
@ -133,8 +90,8 @@ impl ConversationLog {
|
|||
for line in reader.lines().flatten() {
|
||||
let line = line.trim().to_string();
|
||||
if line.is_empty() { continue; }
|
||||
if let Ok(msg) = serde_json::from_str::<Message>(&line) {
|
||||
if let Some(ts) = &msg.timestamp {
|
||||
if let Ok(entry) = serde_json::from_str::<ConversationEntry>(&line) {
|
||||
if let Some(ts) = &entry.message().timestamp {
|
||||
if let Ok(dt) = chrono::DateTime::parse_from_rfc3339(ts) {
|
||||
return Some(dt.to_utc());
|
||||
}
|
||||
|
|
|
|||
|
|
@ -168,12 +168,17 @@ impl Agent {
|
|||
/// Push a conversation message — stamped and logged.
|
||||
fn push_message(&mut self, mut msg: Message) {
|
||||
msg.stamp();
|
||||
let entry = ConversationEntry::Message(msg);
|
||||
self.push_entry(entry);
|
||||
}
|
||||
|
||||
fn push_entry(&mut self, entry: ConversationEntry) {
|
||||
if let Some(ref log) = self.conversation_log {
|
||||
if let Err(e) = log.append(&msg) {
|
||||
eprintln!("warning: failed to log message: {:#}", e);
|
||||
if let Err(e) = log.append(&entry) {
|
||||
eprintln!("warning: failed to log entry: {:#}", e);
|
||||
}
|
||||
}
|
||||
self.context.entries.push(ConversationEntry::Message(msg));
|
||||
self.context.entries.push(entry);
|
||||
}
|
||||
|
||||
/// Push a context-only message (system prompt, identity context,
|
||||
|
|
@ -1000,11 +1005,11 @@ impl Agent {
|
|||
self.context.system_prompt = system_prompt;
|
||||
self.context.personality = personality;
|
||||
|
||||
let all_messages = match &self.conversation_log {
|
||||
let entries = match &self.conversation_log {
|
||||
Some(log) => match log.read_tail(512 * 1024) {
|
||||
Ok(msgs) if !msgs.is_empty() => {
|
||||
dbglog!("[restore] read {} messages from log tail", msgs.len());
|
||||
msgs
|
||||
Ok(entries) if !entries.is_empty() => {
|
||||
dbglog!("[restore] read {} entries from log tail", entries.len());
|
||||
entries
|
||||
}
|
||||
Ok(_) => {
|
||||
dbglog!("[restore] log exists but is empty");
|
||||
|
|
@ -1021,29 +1026,31 @@ impl Agent {
|
|||
}
|
||||
};
|
||||
|
||||
// Filter out system/context messages — we only want the
|
||||
// actual conversation (user prompts, assistant responses,
|
||||
// tool calls/results)
|
||||
let conversation: Vec<Message> = all_messages
|
||||
// Filter out system messages, keep everything else (including Memory entries)
|
||||
let entries: Vec<ConversationEntry> = entries
|
||||
.into_iter()
|
||||
.filter(|m| m.role != Role::System)
|
||||
.filter(|e| e.message().role != Role::System)
|
||||
.collect();
|
||||
dbglog!("[restore] {} messages after filtering system", conversation.len());
|
||||
|
||||
let messages = crate::agent::context::trim_conversation(
|
||||
// Trim to fit context budget
|
||||
let n = entries.len();
|
||||
let conversation: Vec<Message> = entries.iter()
|
||||
.map(|e| e.api_message().clone()).collect();
|
||||
let trimmed = crate::agent::context::trim_conversation(
|
||||
&self.context,
|
||||
&conversation,
|
||||
&self.client.model,
|
||||
&self.tokenizer,
|
||||
);
|
||||
dbglog!("[restore] journal preserved: {} entries",
|
||||
self.context.journal.len());
|
||||
// Don't overwrite journal — already loaded from memory graph
|
||||
self.context.entries = messages.into_iter()
|
||||
.map(ConversationEntry::Message).collect();
|
||||
dbglog!("[restore] built context window: {} entries", self.context.entries.len());
|
||||
// Keep only the entries that survived trimming (by count from the end)
|
||||
let keep = trimmed.len();
|
||||
self.context.entries = entries.into_iter()
|
||||
.skip(n.saturating_sub(keep))
|
||||
.collect();
|
||||
|
||||
dbglog!("[restore] {} entries, journal: {} entries",
|
||||
self.context.entries.len(), self.context.journal.len());
|
||||
self.last_prompt_tokens = 0;
|
||||
|
||||
self.publish_context_state();
|
||||
true
|
||||
}
|
||||
|
|
@ -1068,10 +1075,6 @@ impl Agent {
|
|||
&mut self.context.entries
|
||||
}
|
||||
|
||||
/// Restore from saved conversation entries.
|
||||
pub fn restore(&mut self, entries: Vec<ConversationEntry>) {
|
||||
self.context.entries = entries;
|
||||
}
|
||||
}
|
||||
|
||||
// Context window building, token counting, and error classification
|
||||
|
|
|
|||
|
|
@ -24,7 +24,6 @@
|
|||
use anyhow::Result;
|
||||
use crossterm::event::{Event, EventStream, KeyEventKind};
|
||||
use futures::StreamExt;
|
||||
use std::path::PathBuf;
|
||||
use std::sync::Arc;
|
||||
use std::time::{Duration, Instant};
|
||||
use tokio::sync::{mpsc, Mutex};
|
||||
|
|
@ -124,8 +123,6 @@ struct Session {
|
|||
process_tracker: tools::ProcessTracker,
|
||||
ui_tx: ui_channel::UiSender,
|
||||
turn_tx: mpsc::Sender<(Result<TurnResult>, StreamTarget)>,
|
||||
session_file: PathBuf,
|
||||
|
||||
// DMN state
|
||||
dmn: dmn::State,
|
||||
dmn_turns: u32,
|
||||
|
|
@ -153,7 +150,6 @@ impl Session {
|
|||
process_tracker: tools::ProcessTracker,
|
||||
ui_tx: ui_channel::UiSender,
|
||||
turn_tx: mpsc::Sender<(Result<TurnResult>, StreamTarget)>,
|
||||
session_file: PathBuf,
|
||||
) -> Self {
|
||||
let max_dmn_turns = config.app.dmn.max_turns;
|
||||
|
||||
|
|
@ -163,7 +159,6 @@ impl Session {
|
|||
process_tracker,
|
||||
ui_tx,
|
||||
turn_tx,
|
||||
session_file,
|
||||
dmn: if dmn::is_off() {
|
||||
dmn::State::Off
|
||||
} else {
|
||||
|
|
@ -321,8 +316,6 @@ impl Session {
|
|||
.to_string(),
|
||||
);
|
||||
}
|
||||
|
||||
let _ = save_session(&agent_guard, &self.session_file);
|
||||
}
|
||||
|
||||
/// Send any consolidated pending input as a single turn.
|
||||
|
|
@ -398,14 +391,9 @@ impl Session {
|
|||
match input {
|
||||
"/quit" | "/exit" => Command::Quit,
|
||||
"/save" => {
|
||||
if let Ok(agent) = self.agent.try_lock() {
|
||||
let _ = save_session(&agent, &self.session_file);
|
||||
let _ = self.ui_tx.send(UiMessage::Info("Session saved.".into()));
|
||||
} else {
|
||||
let _ = self
|
||||
.ui_tx
|
||||
.send(UiMessage::Info("(busy — will save after turn)".into()));
|
||||
}
|
||||
let _ = self.ui_tx.send(UiMessage::Info(
|
||||
"Conversation is saved automatically (append-only log).".into()
|
||||
));
|
||||
Command::Handled
|
||||
}
|
||||
"/new" | "/clear" => {
|
||||
|
|
@ -415,10 +403,6 @@ impl Session {
|
|||
.send(UiMessage::Info("(turn in progress, please wait)".into()));
|
||||
return Command::Handled;
|
||||
}
|
||||
{
|
||||
let agent_guard = self.agent.lock().await;
|
||||
let _ = save_session(&agent_guard, &self.session_file);
|
||||
}
|
||||
{
|
||||
let new_log = log::ConversationLog::new(
|
||||
self.config.session_dir.join("conversation.jsonl"),
|
||||
|
|
@ -516,7 +500,6 @@ impl Session {
|
|||
)));
|
||||
}
|
||||
}
|
||||
let _ = save_session(&agent_guard, &self.session_file);
|
||||
self.dmn = dmn::State::Resting {
|
||||
since: Instant::now(),
|
||||
};
|
||||
|
|
@ -861,8 +844,6 @@ impl Session {
|
|||
if let Some(handle) = self.turn_handle.take() {
|
||||
handle.abort();
|
||||
}
|
||||
let agent = self.agent.lock().await;
|
||||
let _ = save_session(&agent, &self.session_file);
|
||||
}
|
||||
}
|
||||
|
||||
|
|
@ -927,29 +908,17 @@ async fn run(cli: cli::CliArgs) -> Result<()> {
|
|||
// so Ctrl+K can kill processes even when the agent is busy.
|
||||
let process_tracker = agent.lock().await.process_tracker.clone();
|
||||
|
||||
// Try to restore from conversation log (primary) or session file (fallback)
|
||||
let session_file = config.session_dir.join("current.json");
|
||||
// Restore conversation from the append-only log
|
||||
{
|
||||
let mut agent_guard = agent.lock().await;
|
||||
let restored = agent_guard.restore_from_log(
|
||||
if agent_guard.restore_from_log(
|
||||
config.system_prompt.clone(),
|
||||
config.context_parts.clone(),
|
||||
);
|
||||
if restored {
|
||||
) {
|
||||
replay_session_to_ui(agent_guard.entries(), &ui_tx);
|
||||
let _ = ui_tx.send(UiMessage::Info(
|
||||
"--- restored from conversation log ---".into(),
|
||||
));
|
||||
} else if session_file.exists() {
|
||||
if let Ok(data) = std::fs::read_to_string(&session_file) {
|
||||
if let Ok(messages) = serde_json::from_str(&data) {
|
||||
agent_guard.restore(messages);
|
||||
replay_session_to_ui(agent_guard.entries(), &ui_tx);
|
||||
let _ = ui_tx.send(UiMessage::Info(
|
||||
"--- restored from session file ---".into(),
|
||||
));
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
|
@ -978,7 +947,6 @@ async fn run(cli: cli::CliArgs) -> Result<()> {
|
|||
process_tracker,
|
||||
ui_tx.clone(),
|
||||
turn_tx,
|
||||
session_file,
|
||||
);
|
||||
session.update_status();
|
||||
session.send_context_info();
|
||||
|
|
@ -1103,12 +1071,6 @@ fn drain_ui_messages(rx: &mut ui_channel::UiReceiver, app: &mut tui::App) {
|
|||
}
|
||||
}
|
||||
|
||||
fn save_session(agent: &Agent, path: &PathBuf) -> Result<()> {
|
||||
let data = serde_json::to_string_pretty(agent.entries())?;
|
||||
std::fs::write(path, data)?;
|
||||
Ok(())
|
||||
}
|
||||
|
||||
async fn run_tool_tests(ui_tx: &ui_channel::UiSender, tracker: &tools::ProcessTracker) {
|
||||
use serde_json::json;
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue