perf(memory): wrap blocking SQLite calls in tokio::task::spawn_blocking
Problem: Every async fn in SqliteMemory acquired self.conn.lock() and ran synchronous rusqlite queries directly on the Tokio runtime thread. This blocks the async executor, preventing other tasks from making progress — especially harmful under concurrent recall/store load.

Fix:
- Change conn from Mutex<Connection> to Arc<Mutex<Connection>> so the connection handle can be cloned into spawn_blocking closures.
- Wrap all synchronous database operations (store, recall, get, list, forget, count, health_check) in tokio::task::spawn_blocking.
- Split get_or_compute_embedding into three phases: cache check (blocking), embedding computation (async I/O), cache store (blocking) — ensuring no lock is held across await points.
- Apply the same pattern to the reindex method.

The async I/O (embedding computation) remains on the Tokio runtime while all SQLite access runs on the blocking thread pool, preventing executor starvation.

Ref: zeroclaw-labs/zeroclaw#710 (Item 4)
Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
This commit is contained in:
parent
83b098d7ac
commit
4e528dde7d
1 changed file with 279 additions and 215 deletions
|
|
@ -25,7 +25,7 @@ const SQLITE_OPEN_TIMEOUT_CAP_SECS: u64 = 300;
|
|||
/// - **Embedding Cache**: LRU-evicted cache to avoid redundant API calls
|
||||
/// - **Safe Reindex**: temp DB → seed → sync → atomic swap → rollback
|
||||
pub struct SqliteMemory {
|
||||
conn: Mutex<Connection>,
|
||||
conn: Arc<Mutex<Connection>>,
|
||||
db_path: PathBuf,
|
||||
embedder: Arc<dyn EmbeddingProvider>,
|
||||
vector_weight: f32,
|
||||
|
|
@ -83,7 +83,7 @@ impl SqliteMemory {
|
|||
Self::init_schema(&conn)?;
|
||||
|
||||
Ok(Self {
|
||||
conn: Mutex::new(conn),
|
||||
conn: Arc::new(Mutex::new(conn)),
|
||||
db_path,
|
||||
embedder,
|
||||
vector_weight,
|
||||
|
|
@ -229,50 +229,56 @@ impl SqliteMemory {
|
|||
let hash = Self::content_hash(text);
|
||||
let now = Local::now().to_rfc3339();
|
||||
|
||||
// Check cache
|
||||
{
|
||||
let conn = self.conn.lock();
|
||||
|
||||
// Check cache (offloaded to blocking thread)
|
||||
let conn = self.conn.clone();
|
||||
let hash_c = hash.clone();
|
||||
let now_c = now.clone();
|
||||
let cached = tokio::task::spawn_blocking(move || -> anyhow::Result<Option<Vec<f32>>> {
|
||||
let conn = conn.lock();
|
||||
let mut stmt =
|
||||
conn.prepare("SELECT embedding FROM embedding_cache WHERE content_hash = ?1")?;
|
||||
let cached: Option<Vec<u8>> = stmt.query_row(params![hash], |row| row.get(0)).ok();
|
||||
|
||||
if let Some(bytes) = cached {
|
||||
// Update accessed_at for LRU
|
||||
let blob: Option<Vec<u8>> = stmt.query_row(params![hash_c], |row| row.get(0)).ok();
|
||||
if let Some(bytes) = blob {
|
||||
conn.execute(
|
||||
"UPDATE embedding_cache SET accessed_at = ?1 WHERE content_hash = ?2",
|
||||
params![now, hash],
|
||||
params![now_c, hash_c],
|
||||
)?;
|
||||
return Ok(Some(vector::bytes_to_vec(&bytes)));
|
||||
}
|
||||
Ok(None)
|
||||
})
|
||||
.await??;
|
||||
|
||||
if cached.is_some() {
|
||||
return Ok(cached);
|
||||
}
|
||||
|
||||
// Compute embedding
|
||||
// Compute embedding (async I/O)
|
||||
let embedding = self.embedder.embed_one(text).await?;
|
||||
let bytes = vector::vec_to_bytes(&embedding);
|
||||
|
||||
// Store in cache + LRU eviction
|
||||
{
|
||||
let conn = self.conn.lock();
|
||||
|
||||
// Store in cache + LRU eviction (offloaded to blocking thread)
|
||||
let conn = self.conn.clone();
|
||||
#[allow(clippy::cast_possible_wrap)]
|
||||
let cache_max = self.cache_max as i64;
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
|
||||
let conn = conn.lock();
|
||||
conn.execute(
|
||||
"INSERT OR REPLACE INTO embedding_cache (content_hash, embedding, created_at, accessed_at)
|
||||
VALUES (?1, ?2, ?3, ?4)",
|
||||
params![hash, bytes, now, now],
|
||||
)?;
|
||||
|
||||
// LRU eviction: keep only cache_max entries
|
||||
#[allow(clippy::cast_possible_wrap)]
|
||||
let max = self.cache_max as i64;
|
||||
conn.execute(
|
||||
"DELETE FROM embedding_cache WHERE content_hash IN (
|
||||
SELECT content_hash FROM embedding_cache
|
||||
ORDER BY accessed_at ASC
|
||||
LIMIT MAX(0, (SELECT COUNT(*) FROM embedding_cache) - ?1)
|
||||
)",
|
||||
params![max],
|
||||
params![cache_max],
|
||||
)?;
|
||||
}
|
||||
Ok(())
|
||||
})
|
||||
.await??;
|
||||
|
||||
Ok(Some(embedding))
|
||||
}
|
||||
|
|
@ -355,9 +361,13 @@ impl SqliteMemory {
|
|||
pub async fn reindex(&self) -> anyhow::Result<usize> {
|
||||
// Step 1: Rebuild FTS5
|
||||
{
|
||||
let conn = self.conn.lock();
|
||||
|
||||
let conn = self.conn.clone();
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
|
||||
let conn = conn.lock();
|
||||
conn.execute_batch("INSERT INTO memories_fts(memories_fts) VALUES('rebuild');")?;
|
||||
Ok(())
|
||||
})
|
||||
.await??;
|
||||
}
|
||||
|
||||
// Step 2: Re-embed all memories that lack embeddings
|
||||
|
|
@ -365,26 +375,33 @@ impl SqliteMemory {
|
|||
return Ok(0);
|
||||
}
|
||||
|
||||
let entries: Vec<(String, String)> = {
|
||||
let conn = self.conn.lock();
|
||||
|
||||
let conn = self.conn.clone();
|
||||
let entries: Vec<(String, String)> = tokio::task::spawn_blocking(move || {
|
||||
let conn = conn.lock();
|
||||
let mut stmt =
|
||||
conn.prepare("SELECT id, content FROM memories WHERE embedding IS NULL")?;
|
||||
let rows = stmt.query_map([], |row| {
|
||||
Ok((row.get::<_, String>(0)?, row.get::<_, String>(1)?))
|
||||
})?;
|
||||
rows.filter_map(std::result::Result::ok).collect()
|
||||
};
|
||||
Ok::<_, anyhow::Error>(rows.filter_map(std::result::Result::ok).collect())
|
||||
})
|
||||
.await??;
|
||||
|
||||
let mut count = 0;
|
||||
for (id, content) in &entries {
|
||||
if let Ok(Some(emb)) = self.get_or_compute_embedding(content).await {
|
||||
let bytes = vector::vec_to_bytes(&emb);
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let id = id.clone();
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
|
||||
let conn = conn.lock();
|
||||
conn.execute(
|
||||
"UPDATE memories SET embedding = ?1 WHERE id = ?2",
|
||||
params![bytes, id],
|
||||
)?;
|
||||
Ok(())
|
||||
})
|
||||
.await??;
|
||||
count += 1;
|
||||
}
|
||||
}
|
||||
|
|
@ -406,13 +423,19 @@ impl Memory for SqliteMemory {
|
|||
category: MemoryCategory,
|
||||
session_id: Option<&str>,
|
||||
) -> anyhow::Result<()> {
|
||||
// Compute embedding (async, before lock)
|
||||
// Compute embedding (async, before blocking work)
|
||||
let embedding_bytes = self
|
||||
.get_or_compute_embedding(content)
|
||||
.await?
|
||||
.map(|emb| vector::vec_to_bytes(&emb));
|
||||
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let key = key.to_string();
|
||||
let content = content.to_string();
|
||||
let session_id = session_id.map(String::from);
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
|
||||
let conn = conn.lock();
|
||||
let now = Local::now().to_rfc3339();
|
||||
let cat = Self::category_to_str(&category);
|
||||
let id = Uuid::new_v4().to_string();
|
||||
|
|
@ -428,8 +451,9 @@ impl Memory for SqliteMemory {
|
|||
session_id = excluded.session_id",
|
||||
params![id, key, content, cat, embedding_bytes, now, now, session_id],
|
||||
)?;
|
||||
|
||||
Ok(())
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn recall(
|
||||
|
|
@ -442,13 +466,22 @@ impl Memory for SqliteMemory {
|
|||
return Ok(Vec::new());
|
||||
}
|
||||
|
||||
// Compute query embedding (async, before lock)
|
||||
// Compute query embedding (async, before blocking work)
|
||||
let query_embedding = self.get_or_compute_embedding(query).await?;
|
||||
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let query = query.to_string();
|
||||
let session_id = session_id.map(String::from);
|
||||
let vector_weight = self.vector_weight;
|
||||
let keyword_weight = self.keyword_weight;
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<Vec<MemoryEntry>> {
|
||||
let conn = conn.lock();
|
||||
let session_ref = session_id.as_deref();
|
||||
|
||||
// FTS5 BM25 keyword search
|
||||
let keyword_results = Self::fts5_search(&conn, query, limit * 2).unwrap_or_default();
|
||||
let keyword_results =
|
||||
Self::fts5_search(&conn, &query, limit * 2).unwrap_or_default();
|
||||
|
||||
// Vector similarity search (if embeddings available)
|
||||
let vector_results = if let Some(ref qe) = query_embedding {
|
||||
|
|
@ -459,7 +492,6 @@ impl Memory for SqliteMemory {
|
|||
|
||||
// Hybrid merge
|
||||
let merged = if vector_results.is_empty() {
|
||||
// No embeddings — use keyword results only
|
||||
keyword_results
|
||||
.iter()
|
||||
.map(|(id, score)| vector::ScoredResult {
|
||||
|
|
@ -473,8 +505,8 @@ impl Memory for SqliteMemory {
|
|||
vector::hybrid_merge(
|
||||
&vector_results,
|
||||
&keyword_results,
|
||||
self.vector_weight,
|
||||
self.keyword_weight,
|
||||
vector_weight,
|
||||
keyword_weight,
|
||||
limit,
|
||||
)
|
||||
};
|
||||
|
|
@ -496,8 +528,7 @@ impl Memory for SqliteMemory {
|
|||
score: Some(f64::from(scored.final_score)),
|
||||
})
|
||||
}) {
|
||||
// Filter by session_id if requested
|
||||
if let Some(sid) = session_id {
|
||||
if let Some(sid) = session_ref {
|
||||
if entry.session_id.as_deref() != Some(sid) {
|
||||
continue;
|
||||
}
|
||||
|
|
@ -515,7 +546,11 @@ impl Memory for SqliteMemory {
|
|||
.iter()
|
||||
.enumerate()
|
||||
.map(|(i, _)| {
|
||||
format!("(content LIKE ?{} OR key LIKE ?{})", i * 2 + 1, i * 2 + 2)
|
||||
format!(
|
||||
"(content LIKE ?{} OR key LIKE ?{})",
|
||||
i * 2 + 1,
|
||||
i * 2 + 2
|
||||
)
|
||||
})
|
||||
.collect();
|
||||
let where_clause = conditions.join(" OR ");
|
||||
|
|
@ -549,7 +584,7 @@ impl Memory for SqliteMemory {
|
|||
})?;
|
||||
for row in rows {
|
||||
let entry = row?;
|
||||
if let Some(sid) = session_id {
|
||||
if let Some(sid) = session_ref {
|
||||
if entry.session_id.as_deref() != Some(sid) {
|
||||
continue;
|
||||
}
|
||||
|
|
@ -561,11 +596,16 @@ impl Memory for SqliteMemory {
|
|||
|
||||
results.truncate(limit);
|
||||
Ok(results)
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn get(&self, key: &str) -> anyhow::Result<Option<MemoryEntry>> {
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let key = key.to_string();
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<Option<MemoryEntry>> {
|
||||
let conn = conn.lock();
|
||||
let mut stmt = conn.prepare(
|
||||
"SELECT id, key, content, category, created_at, session_id FROM memories WHERE key = ?1",
|
||||
)?;
|
||||
|
|
@ -586,6 +626,8 @@ impl Memory for SqliteMemory {
|
|||
Some(Ok(entry)) => Ok(Some(entry)),
|
||||
_ => Ok(None),
|
||||
}
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn list(
|
||||
|
|
@ -593,8 +635,13 @@ impl Memory for SqliteMemory {
|
|||
category: Option<&MemoryCategory>,
|
||||
session_id: Option<&str>,
|
||||
) -> anyhow::Result<Vec<MemoryEntry>> {
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let category = category.cloned();
|
||||
let session_id = session_id.map(String::from);
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<Vec<MemoryEntry>> {
|
||||
let conn = conn.lock();
|
||||
let session_ref = session_id.as_deref();
|
||||
let mut results = Vec::new();
|
||||
|
||||
let row_mapper = |row: &rusqlite::Row| -> rusqlite::Result<MemoryEntry> {
|
||||
|
|
@ -609,7 +656,7 @@ impl Memory for SqliteMemory {
|
|||
})
|
||||
};
|
||||
|
||||
if let Some(cat) = category {
|
||||
if let Some(ref cat) = category {
|
||||
let cat_str = Self::category_to_str(cat);
|
||||
let mut stmt = conn.prepare(
|
||||
"SELECT id, key, content, category, created_at, session_id FROM memories
|
||||
|
|
@ -618,7 +665,7 @@ impl Memory for SqliteMemory {
|
|||
let rows = stmt.query_map(params![cat_str], row_mapper)?;
|
||||
for row in rows {
|
||||
let entry = row?;
|
||||
if let Some(sid) = session_id {
|
||||
if let Some(sid) = session_ref {
|
||||
if entry.session_id.as_deref() != Some(sid) {
|
||||
continue;
|
||||
}
|
||||
|
|
@ -633,7 +680,7 @@ impl Memory for SqliteMemory {
|
|||
let rows = stmt.query_map([], row_mapper)?;
|
||||
for row in rows {
|
||||
let entry = row?;
|
||||
if let Some(sid) = session_id {
|
||||
if let Some(sid) = session_ref {
|
||||
if entry.session_id.as_deref() != Some(sid) {
|
||||
continue;
|
||||
}
|
||||
|
|
@ -643,23 +690,40 @@ impl Memory for SqliteMemory {
|
|||
}
|
||||
|
||||
Ok(results)
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn forget(&self, key: &str) -> anyhow::Result<bool> {
|
||||
let conn = self.conn.lock();
|
||||
let conn = self.conn.clone();
|
||||
let key = key.to_string();
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<bool> {
|
||||
let conn = conn.lock();
|
||||
let affected = conn.execute("DELETE FROM memories WHERE key = ?1", params![key])?;
|
||||
Ok(affected > 0)
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn count(&self) -> anyhow::Result<usize> {
|
||||
let conn = self.conn.lock();
|
||||
let count: i64 = conn.query_row("SELECT COUNT(*) FROM memories", [], |row| row.get(0))?;
|
||||
let conn = self.conn.clone();
|
||||
|
||||
tokio::task::spawn_blocking(move || -> anyhow::Result<usize> {
|
||||
let conn = conn.lock();
|
||||
let count: i64 =
|
||||
conn.query_row("SELECT COUNT(*) FROM memories", [], |row| row.get(0))?;
|
||||
#[allow(clippy::cast_sign_loss, clippy::cast_possible_truncation)]
|
||||
Ok(count as usize)
|
||||
})
|
||||
.await?
|
||||
}
|
||||
|
||||
async fn health_check(&self) -> bool {
|
||||
self.conn.lock().execute_batch("SELECT 1").is_ok()
|
||||
let conn = self.conn.clone();
|
||||
tokio::task::spawn_blocking(move || conn.lock().execute_batch("SELECT 1").is_ok())
|
||||
.await
|
||||
.unwrap_or(false)
|
||||
}
|
||||
}
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue