perf(memory): wrap blocking SQLite calls in tokio::task::spawn_blocking

Problem:
Every async fn in SqliteMemory acquired self.conn.lock() and ran
synchronous rusqlite queries directly on the Tokio runtime thread.
This blocks the async executor, preventing other tasks from making
progress — especially harmful under concurrent recall/store load.

Fix:
- Change conn from Mutex<Connection> to Arc<Mutex<Connection>> so
  the connection handle can be cloned into spawn_blocking closures.
- Wrap all synchronous database operations (store, recall, get, list,
  forget, count, health_check) in tokio::task::spawn_blocking.
- Split get_or_compute_embedding into three phases: cache check
  (blocking), embedding computation (async I/O), cache store
  (blocking) — ensuring no lock is held across await points.
- Apply the same pattern to the reindex method.

The async I/O (embedding computation) remains on the Tokio runtime
while all SQLite access runs on the blocking thread pool, preventing
executor starvation.

Ref: zeroclaw-labs/zeroclaw#710 (Item 4)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
This commit is contained in:
Alex Gorevski 2026-02-17 19:48:51 -08:00 committed by Chummy
parent 83b098d7ac
commit 4e528dde7d

View file

@ -25,7 +25,7 @@ const SQLITE_OPEN_TIMEOUT_CAP_SECS: u64 = 300;
/// - **Embedding Cache**: LRU-evicted cache to avoid redundant API calls /// - **Embedding Cache**: LRU-evicted cache to avoid redundant API calls
/// - **Safe Reindex**: temp DB → seed → sync → atomic swap → rollback /// - **Safe Reindex**: temp DB → seed → sync → atomic swap → rollback
pub struct SqliteMemory { pub struct SqliteMemory {
conn: Mutex<Connection>, conn: Arc<Mutex<Connection>>,
db_path: PathBuf, db_path: PathBuf,
embedder: Arc<dyn EmbeddingProvider>, embedder: Arc<dyn EmbeddingProvider>,
vector_weight: f32, vector_weight: f32,
@ -83,7 +83,7 @@ impl SqliteMemory {
Self::init_schema(&conn)?; Self::init_schema(&conn)?;
Ok(Self { Ok(Self {
conn: Mutex::new(conn), conn: Arc::new(Mutex::new(conn)),
db_path, db_path,
embedder, embedder,
vector_weight, vector_weight,
@ -229,50 +229,56 @@ impl SqliteMemory {
let hash = Self::content_hash(text); let hash = Self::content_hash(text);
let now = Local::now().to_rfc3339(); let now = Local::now().to_rfc3339();
// Check cache // Check cache (offloaded to blocking thread)
{ let conn = self.conn.clone();
let conn = self.conn.lock(); let hash_c = hash.clone();
let now_c = now.clone();
let cached = tokio::task::spawn_blocking(move || -> anyhow::Result<Option<Vec<f32>>> {
let conn = conn.lock();
let mut stmt = let mut stmt =
conn.prepare("SELECT embedding FROM embedding_cache WHERE content_hash = ?1")?; conn.prepare("SELECT embedding FROM embedding_cache WHERE content_hash = ?1")?;
let cached: Option<Vec<u8>> = stmt.query_row(params![hash], |row| row.get(0)).ok(); let blob: Option<Vec<u8>> = stmt.query_row(params![hash_c], |row| row.get(0)).ok();
if let Some(bytes) = blob {
if let Some(bytes) = cached {
// Update accessed_at for LRU
conn.execute( conn.execute(
"UPDATE embedding_cache SET accessed_at = ?1 WHERE content_hash = ?2", "UPDATE embedding_cache SET accessed_at = ?1 WHERE content_hash = ?2",
params![now, hash], params![now_c, hash_c],
)?; )?;
return Ok(Some(vector::bytes_to_vec(&bytes))); return Ok(Some(vector::bytes_to_vec(&bytes)));
} }
Ok(None)
})
.await??;
if cached.is_some() {
return Ok(cached);
} }
// Compute embedding // Compute embedding (async I/O)
let embedding = self.embedder.embed_one(text).await?; let embedding = self.embedder.embed_one(text).await?;
let bytes = vector::vec_to_bytes(&embedding); let bytes = vector::vec_to_bytes(&embedding);
// Store in cache + LRU eviction // Store in cache + LRU eviction (offloaded to blocking thread)
{ let conn = self.conn.clone();
let conn = self.conn.lock(); #[allow(clippy::cast_possible_wrap)]
let cache_max = self.cache_max as i64;
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
let conn = conn.lock();
conn.execute( conn.execute(
"INSERT OR REPLACE INTO embedding_cache (content_hash, embedding, created_at, accessed_at) "INSERT OR REPLACE INTO embedding_cache (content_hash, embedding, created_at, accessed_at)
VALUES (?1, ?2, ?3, ?4)", VALUES (?1, ?2, ?3, ?4)",
params![hash, bytes, now, now], params![hash, bytes, now, now],
)?; )?;
// LRU eviction: keep only cache_max entries
#[allow(clippy::cast_possible_wrap)]
let max = self.cache_max as i64;
conn.execute( conn.execute(
"DELETE FROM embedding_cache WHERE content_hash IN ( "DELETE FROM embedding_cache WHERE content_hash IN (
SELECT content_hash FROM embedding_cache SELECT content_hash FROM embedding_cache
ORDER BY accessed_at ASC ORDER BY accessed_at ASC
LIMIT MAX(0, (SELECT COUNT(*) FROM embedding_cache) - ?1) LIMIT MAX(0, (SELECT COUNT(*) FROM embedding_cache) - ?1)
)", )",
params![max], params![cache_max],
)?; )?;
} Ok(())
})
.await??;
Ok(Some(embedding)) Ok(Some(embedding))
} }
@ -355,9 +361,13 @@ impl SqliteMemory {
pub async fn reindex(&self) -> anyhow::Result<usize> { pub async fn reindex(&self) -> anyhow::Result<usize> {
// Step 1: Rebuild FTS5 // Step 1: Rebuild FTS5
{ {
let conn = self.conn.lock(); let conn = self.conn.clone();
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
let conn = conn.lock();
conn.execute_batch("INSERT INTO memories_fts(memories_fts) VALUES('rebuild');")?; conn.execute_batch("INSERT INTO memories_fts(memories_fts) VALUES('rebuild');")?;
Ok(())
})
.await??;
} }
// Step 2: Re-embed all memories that lack embeddings // Step 2: Re-embed all memories that lack embeddings
@ -365,26 +375,33 @@ impl SqliteMemory {
return Ok(0); return Ok(0);
} }
let entries: Vec<(String, String)> = { let conn = self.conn.clone();
let conn = self.conn.lock(); let entries: Vec<(String, String)> = tokio::task::spawn_blocking(move || {
let conn = conn.lock();
let mut stmt = let mut stmt =
conn.prepare("SELECT id, content FROM memories WHERE embedding IS NULL")?; conn.prepare("SELECT id, content FROM memories WHERE embedding IS NULL")?;
let rows = stmt.query_map([], |row| { let rows = stmt.query_map([], |row| {
Ok((row.get::<_, String>(0)?, row.get::<_, String>(1)?)) Ok((row.get::<_, String>(0)?, row.get::<_, String>(1)?))
})?; })?;
rows.filter_map(std::result::Result::ok).collect() Ok::<_, anyhow::Error>(rows.filter_map(std::result::Result::ok).collect())
}; })
.await??;
let mut count = 0; let mut count = 0;
for (id, content) in &entries { for (id, content) in &entries {
if let Ok(Some(emb)) = self.get_or_compute_embedding(content).await { if let Ok(Some(emb)) = self.get_or_compute_embedding(content).await {
let bytes = vector::vec_to_bytes(&emb); let bytes = vector::vec_to_bytes(&emb);
let conn = self.conn.lock(); let conn = self.conn.clone();
let id = id.clone();
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
let conn = conn.lock();
conn.execute( conn.execute(
"UPDATE memories SET embedding = ?1 WHERE id = ?2", "UPDATE memories SET embedding = ?1 WHERE id = ?2",
params![bytes, id], params![bytes, id],
)?; )?;
Ok(())
})
.await??;
count += 1; count += 1;
} }
} }
@ -406,13 +423,19 @@ impl Memory for SqliteMemory {
category: MemoryCategory, category: MemoryCategory,
session_id: Option<&str>, session_id: Option<&str>,
) -> anyhow::Result<()> { ) -> anyhow::Result<()> {
// Compute embedding (async, before lock) // Compute embedding (async, before blocking work)
let embedding_bytes = self let embedding_bytes = self
.get_or_compute_embedding(content) .get_or_compute_embedding(content)
.await? .await?
.map(|emb| vector::vec_to_bytes(&emb)); .map(|emb| vector::vec_to_bytes(&emb));
let conn = self.conn.lock(); let conn = self.conn.clone();
let key = key.to_string();
let content = content.to_string();
let session_id = session_id.map(String::from);
tokio::task::spawn_blocking(move || -> anyhow::Result<()> {
let conn = conn.lock();
let now = Local::now().to_rfc3339(); let now = Local::now().to_rfc3339();
let cat = Self::category_to_str(&category); let cat = Self::category_to_str(&category);
let id = Uuid::new_v4().to_string(); let id = Uuid::new_v4().to_string();
@ -428,8 +451,9 @@ impl Memory for SqliteMemory {
session_id = excluded.session_id", session_id = excluded.session_id",
params![id, key, content, cat, embedding_bytes, now, now, session_id], params![id, key, content, cat, embedding_bytes, now, now, session_id],
)?; )?;
Ok(()) Ok(())
})
.await?
} }
async fn recall( async fn recall(
@ -442,13 +466,22 @@ impl Memory for SqliteMemory {
return Ok(Vec::new()); return Ok(Vec::new());
} }
// Compute query embedding (async, before lock) // Compute query embedding (async, before blocking work)
let query_embedding = self.get_or_compute_embedding(query).await?; let query_embedding = self.get_or_compute_embedding(query).await?;
let conn = self.conn.lock(); let conn = self.conn.clone();
let query = query.to_string();
let session_id = session_id.map(String::from);
let vector_weight = self.vector_weight;
let keyword_weight = self.keyword_weight;
tokio::task::spawn_blocking(move || -> anyhow::Result<Vec<MemoryEntry>> {
let conn = conn.lock();
let session_ref = session_id.as_deref();
// FTS5 BM25 keyword search // FTS5 BM25 keyword search
let keyword_results = Self::fts5_search(&conn, query, limit * 2).unwrap_or_default(); let keyword_results =
Self::fts5_search(&conn, &query, limit * 2).unwrap_or_default();
// Vector similarity search (if embeddings available) // Vector similarity search (if embeddings available)
let vector_results = if let Some(ref qe) = query_embedding { let vector_results = if let Some(ref qe) = query_embedding {
@ -459,7 +492,6 @@ impl Memory for SqliteMemory {
// Hybrid merge // Hybrid merge
let merged = if vector_results.is_empty() { let merged = if vector_results.is_empty() {
// No embeddings — use keyword results only
keyword_results keyword_results
.iter() .iter()
.map(|(id, score)| vector::ScoredResult { .map(|(id, score)| vector::ScoredResult {
@ -473,8 +505,8 @@ impl Memory for SqliteMemory {
vector::hybrid_merge( vector::hybrid_merge(
&vector_results, &vector_results,
&keyword_results, &keyword_results,
self.vector_weight, vector_weight,
self.keyword_weight, keyword_weight,
limit, limit,
) )
}; };
@ -496,8 +528,7 @@ impl Memory for SqliteMemory {
score: Some(f64::from(scored.final_score)), score: Some(f64::from(scored.final_score)),
}) })
}) { }) {
// Filter by session_id if requested if let Some(sid) = session_ref {
if let Some(sid) = session_id {
if entry.session_id.as_deref() != Some(sid) { if entry.session_id.as_deref() != Some(sid) {
continue; continue;
} }
@ -515,7 +546,11 @@ impl Memory for SqliteMemory {
.iter() .iter()
.enumerate() .enumerate()
.map(|(i, _)| { .map(|(i, _)| {
format!("(content LIKE ?{} OR key LIKE ?{})", i * 2 + 1, i * 2 + 2) format!(
"(content LIKE ?{} OR key LIKE ?{})",
i * 2 + 1,
i * 2 + 2
)
}) })
.collect(); .collect();
let where_clause = conditions.join(" OR "); let where_clause = conditions.join(" OR ");
@ -549,7 +584,7 @@ impl Memory for SqliteMemory {
})?; })?;
for row in rows { for row in rows {
let entry = row?; let entry = row?;
if let Some(sid) = session_id { if let Some(sid) = session_ref {
if entry.session_id.as_deref() != Some(sid) { if entry.session_id.as_deref() != Some(sid) {
continue; continue;
} }
@ -561,11 +596,16 @@ impl Memory for SqliteMemory {
results.truncate(limit); results.truncate(limit);
Ok(results) Ok(results)
})
.await?
} }
async fn get(&self, key: &str) -> anyhow::Result<Option<MemoryEntry>> { async fn get(&self, key: &str) -> anyhow::Result<Option<MemoryEntry>> {
let conn = self.conn.lock(); let conn = self.conn.clone();
let key = key.to_string();
tokio::task::spawn_blocking(move || -> anyhow::Result<Option<MemoryEntry>> {
let conn = conn.lock();
let mut stmt = conn.prepare( let mut stmt = conn.prepare(
"SELECT id, key, content, category, created_at, session_id FROM memories WHERE key = ?1", "SELECT id, key, content, category, created_at, session_id FROM memories WHERE key = ?1",
)?; )?;
@ -586,6 +626,8 @@ impl Memory for SqliteMemory {
Some(Ok(entry)) => Ok(Some(entry)), Some(Ok(entry)) => Ok(Some(entry)),
_ => Ok(None), _ => Ok(None),
} }
})
.await?
} }
async fn list( async fn list(
@ -593,8 +635,13 @@ impl Memory for SqliteMemory {
category: Option<&MemoryCategory>, category: Option<&MemoryCategory>,
session_id: Option<&str>, session_id: Option<&str>,
) -> anyhow::Result<Vec<MemoryEntry>> { ) -> anyhow::Result<Vec<MemoryEntry>> {
let conn = self.conn.lock(); let conn = self.conn.clone();
let category = category.cloned();
let session_id = session_id.map(String::from);
tokio::task::spawn_blocking(move || -> anyhow::Result<Vec<MemoryEntry>> {
let conn = conn.lock();
let session_ref = session_id.as_deref();
let mut results = Vec::new(); let mut results = Vec::new();
let row_mapper = |row: &rusqlite::Row| -> rusqlite::Result<MemoryEntry> { let row_mapper = |row: &rusqlite::Row| -> rusqlite::Result<MemoryEntry> {
@ -609,7 +656,7 @@ impl Memory for SqliteMemory {
}) })
}; };
if let Some(cat) = category { if let Some(ref cat) = category {
let cat_str = Self::category_to_str(cat); let cat_str = Self::category_to_str(cat);
let mut stmt = conn.prepare( let mut stmt = conn.prepare(
"SELECT id, key, content, category, created_at, session_id FROM memories "SELECT id, key, content, category, created_at, session_id FROM memories
@ -618,7 +665,7 @@ impl Memory for SqliteMemory {
let rows = stmt.query_map(params![cat_str], row_mapper)?; let rows = stmt.query_map(params![cat_str], row_mapper)?;
for row in rows { for row in rows {
let entry = row?; let entry = row?;
if let Some(sid) = session_id { if let Some(sid) = session_ref {
if entry.session_id.as_deref() != Some(sid) { if entry.session_id.as_deref() != Some(sid) {
continue; continue;
} }
@ -633,7 +680,7 @@ impl Memory for SqliteMemory {
let rows = stmt.query_map([], row_mapper)?; let rows = stmt.query_map([], row_mapper)?;
for row in rows { for row in rows {
let entry = row?; let entry = row?;
if let Some(sid) = session_id { if let Some(sid) = session_ref {
if entry.session_id.as_deref() != Some(sid) { if entry.session_id.as_deref() != Some(sid) {
continue; continue;
} }
@ -643,23 +690,40 @@ impl Memory for SqliteMemory {
} }
Ok(results) Ok(results)
})
.await?
} }
async fn forget(&self, key: &str) -> anyhow::Result<bool> { async fn forget(&self, key: &str) -> anyhow::Result<bool> {
let conn = self.conn.lock(); let conn = self.conn.clone();
let key = key.to_string();
tokio::task::spawn_blocking(move || -> anyhow::Result<bool> {
let conn = conn.lock();
let affected = conn.execute("DELETE FROM memories WHERE key = ?1", params![key])?; let affected = conn.execute("DELETE FROM memories WHERE key = ?1", params![key])?;
Ok(affected > 0) Ok(affected > 0)
})
.await?
} }
async fn count(&self) -> anyhow::Result<usize> { async fn count(&self) -> anyhow::Result<usize> {
let conn = self.conn.lock(); let conn = self.conn.clone();
let count: i64 = conn.query_row("SELECT COUNT(*) FROM memories", [], |row| row.get(0))?;
tokio::task::spawn_blocking(move || -> anyhow::Result<usize> {
let conn = conn.lock();
let count: i64 =
conn.query_row("SELECT COUNT(*) FROM memories", [], |row| row.get(0))?;
#[allow(clippy::cast_sign_loss, clippy::cast_possible_truncation)] #[allow(clippy::cast_sign_loss, clippy::cast_possible_truncation)]
Ok(count as usize) Ok(count as usize)
})
.await?
} }
async fn health_check(&self) -> bool { async fn health_check(&self) -> bool {
self.conn.lock().execute_batch("SELECT 1").is_ok() let conn = self.conn.clone();
tokio::task::spawn_blocking(move || conn.lock().execute_batch("SELECT 1").is_ok())
.await
.unwrap_or(false)
} }
} }