use std::{
cmp,
collections::BTreeMap,
iter,
mem,
sync::{
atomic::{
AtomicU32,
Ordering,
},
Arc,
LazyLock,
},
time::{
Duration,
SystemTime,
},
};
use async_broadcast::{
broadcast,
Receiver,
Sender,
};
use common::{
components::PublicFunctionPath,
execution_context::ExecutionContext,
identity::IdentityCacheKey,
knobs::{
DATABASE_UDF_SYSTEM_TIMEOUT,
DATABASE_UDF_USER_TIMEOUT,
},
query_journal::QueryJournal,
runtime::Runtime,
types::{
AllowedVisibility,
FunctionCaller,
TableName,
TableStats,
Timestamp,
UdfType,
},
value::ConvexArray,
RequestId,
};
use database::{
Database,
Token,
};
use errors::ErrorMetadataAnyhowExt;
use futures::{
select_biased,
FutureExt,
};
use keybroker::Identity;
use lru::LruCache;
use metrics::{
get_timer,
log_cache_size,
log_drop_cache_result_too_old,
log_perform_go,
log_perform_wait_peer_timeout,
log_perform_wait_self_timeout,
log_plan_go,
log_plan_peer_timeout,
log_plan_ready,
log_plan_wait,
log_query_bandwidth_bytes,
log_success,
log_validate_refresh_failed,
log_validate_system_time_in_the_future,
log_validate_system_time_too_old,
log_validate_ts_too_old,
query_cache_log_eviction,
succeed_get_timer,
GoReason,
};
use parking_lot::Mutex;
use smallvec::{
smallvec,
SmallVec,
};
use udf::{
validation::ValidatedPathAndArgs,
FunctionOutcome,
UdfOutcome,
};
use usage_tracking::FunctionUsageTracker;
use value::{
heap_size::HeapSize,
ConvexValue,
};
use crate::{
application_function_runner::FunctionRouter,
function_log::FunctionExecutionLog,
QueryReturn,
};
mod metrics;
// Maximum age of results to tolerate if they're time-dependent.
pub const MAX_CACHE_AGE: Duration = Duration::from_secs(5);
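// Upper bound on how long a single cached-query request may spend in the caching
// algorithm (planning, waiting on a peer, executing, and validating) before we
// fail fast instead of piling more load onto a slow system.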
static TOTAL_QUERY_TIMEOUT: LazyLock<Duration> =
LazyLock::new(|| *DATABASE_UDF_USER_TIMEOUT + *DATABASE_UDF_SYSTEM_TIMEOUT);
#[derive(Clone)]
pub struct CacheManager<RT: Runtime> {
rt: RT,
database: Database<RT>,
function_router: FunctionRouter<RT>,
udf_execution: FunctionExecutionLog<RT>,
instance_id: InstanceId,
cache: QueryCache,
}
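/// Identifies one `CacheManager` within the process. Each instance gets its own
/// key space inside the shared `QueryCache` (via the `instance` field of the
/// cache keys), while the size limit is enforced globally across all instances.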
#[derive(Copy, Clone, Eq, PartialEq, Hash, Debug)]
struct InstanceId(u32);
impl InstanceId {
fn allocate() -> Self {
static NEXT_INSTANCE_ID: AtomicU32 = AtomicU32::new(0);
let id = NEXT_INSTANCE_ID.fetch_add(1, Ordering::SeqCst);
assert_ne!(id, u32::MAX, "instance id overflow");
InstanceId(id)
}
}
/// A cache key representing a specific query request, before it runs.
/// It may have more specific information than a `StoredCacheKey`, because
/// multiple query requests may be served by the same cache entry.
/// e.g. if a query does not check `ctx.auth`, then `RequestedCacheKey`
/// contains the identity, but `StoredCacheKey` does not.
#[derive(Clone, Eq, PartialEq, Hash, Debug)]
pub struct RequestedCacheKey {
instance: InstanceId,
path: PublicFunctionPath,
args: ConvexArray,
identity: IdentityCacheKey,
journal: QueryJournal,
allowed_visibility: AllowedVisibility,
}
impl RequestedCacheKey {
// In order from most specific to least specific.
fn _possible_cache_keys(&self) -> Vec<StoredCacheKey> {
vec![
self.precise_cache_key(),
StoredCacheKey {
instance: self.instance,
path: self.path.clone(),
args: self.args.clone(),
// Include queries that did not read `ctx.auth`.
identity: None,
journal: self.journal.clone(),
allowed_visibility: self.allowed_visibility,
},
]
}
fn precise_cache_key(&self) -> StoredCacheKey {
StoredCacheKey {
instance: self.instance,
path: self.path.clone(),
args: self.args.clone(),
identity: Some(self.identity.clone()),
journal: self.journal.clone(),
allowed_visibility: self.allowed_visibility,
}
}
fn get_cache_entry<'a>(
&'a self,
cache: &'a mut LruCache<StoredCacheKey, CacheEntry>,
stored_key_hint: Option<&'_ StoredCacheKey>,
) -> (Option<&'a CacheEntry>, StoredCacheKey) {
for key in self._possible_cache_keys() {
if cache.contains(&key) {
return (Some(cache.get(&key).unwrap()), key);
}
}
if let Some(stored_key_hint) = stored_key_hint {
assert!(self._possible_cache_keys().contains(stored_key_hint));
(None, stored_key_hint.clone())
} else {
(None, self.precise_cache_key())
}
}
fn cache_keys_after_execution(&self, outcome: &UdfOutcome) -> SmallVec<[StoredCacheKey; 2]> {
let identity = if outcome.observed_identity {
Some(self.identity.clone())
} else {
None
};
let key = StoredCacheKey {
instance: self.instance,
path: self.path.clone(),
args: self.args.clone(),
identity,
journal: self.journal.clone(),
allowed_visibility: self.allowed_visibility,
};
if self.journal != outcome.journal {
// Record the result under *both* the original journal and the new
// journal, as we expect re-executing the query with
// `outcome.journal` to return the same result.
//
// This would typically happen if `self.journal` is empty (e.g. a
// fresh caller starting a new paginated query), in which case
// `outcome.journal` would contain a newly created journal. We want
// to be able to cache requests from both the _same_ caller (who
// will make their next request using `outcome.journal`) and from
// new callers (who will use an empty journal).
//
// The journal could also change if the query starts paginating over
// a different range of the table or a different table entirely.
smallvec![
StoredCacheKey {
journal: outcome.journal.clone(),
..key.clone()
},
key
]
} else {
smallvec![key]
}
}
}
/// A cache key representing a persisted query result.
#[derive(Clone, Eq, PartialEq, Hash, Debug)]
pub struct StoredCacheKey {
instance: InstanceId,
path: PublicFunctionPath,
args: ConvexArray,
// None means that the query did not read `ctx.auth`.
identity: Option<IdentityCacheKey>,
journal: QueryJournal,
allowed_visibility: AllowedVisibility,
}
impl StoredCacheKey {
/// Approximate size in-memory of the CacheEntry structure, including stack
/// and heap allocated memory.
fn size(&self) -> usize {
mem::size_of::<Self>()
+ self.path.heap_size()
+ self.args.heap_size()
+ self.identity.heap_size()
+ self.journal.heap_size()
}
}
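/// A cache slot: either a completed result that can be served directly, or a
/// placeholder for an execution that is currently in flight, which later callers
/// can subscribe to instead of re-running the UDF.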
enum CacheEntry {
Ready(CacheResult),
Waiting {
id: u64,
started: tokio::time::Instant,
receiver: Receiver<CacheResult>,
// The UDF is being executed at this timestamp.
ts: Timestamp,
},
}
impl CacheEntry {
/// Approximate size in-memory of the CacheEntry structure, including stack
/// and heap allocated memory.
fn size(&self) -> usize {
mem::size_of::<Self>()
+ match self {
CacheEntry::Ready(ref result) => result.heap_size(),
                // This is an undercount since there might be something in the receiver.
                // However, that is hard to measure, and we expect it to be the exception,
                // not the rule.
CacheEntry::Waiting { .. } => 0,
}
}
}
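/// A successfully executed query outcome, the timestamp it originally ran at, and
/// the read-set token used to revalidate it at later timestamps.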
#[derive(Clone)]
struct CacheResult {
outcome: Arc<UdfOutcome>,
original_ts: Timestamp,
token: Token,
}
impl HeapSize for CacheResult {
fn heap_size(&self) -> usize {
self.outcome.heap_size() + self.original_ts.heap_size() + self.token.heap_size()
}
}
impl<RT: Runtime> CacheManager<RT> {
pub fn new(
rt: RT,
database: Database<RT>,
function_router: FunctionRouter<RT>,
udf_execution: FunctionExecutionLog<RT>,
cache: QueryCache,
) -> Self {
        // Each `CacheManager` (for a different instance) gets its own cache key space
        // within the shared `QueryCache`, which has a _global_ size limit.
let instance_id = InstanceId::allocate();
Self {
rt,
database,
function_router,
udf_execution,
instance_id,
cache,
}
}
/// Execute a UDF with the given arguments and identity at a particular
/// timestamp. This function internally handles LRU caching these
/// function executions and ensuring that served cache values are
/// consistent as of the given timestamp.
#[fastrace::trace]
pub async fn get(
&self,
request_id: RequestId,
path: PublicFunctionPath,
args: ConvexArray,
identity: Identity,
ts: Timestamp,
journal: Option<QueryJournal>,
caller: FunctionCaller,
usage_tracker: FunctionUsageTracker,
) -> anyhow::Result<QueryReturn> {
let timer = get_timer();
let result = self
._get(
request_id,
path,
args,
identity,
ts,
journal,
caller,
usage_tracker,
)
.await;
match &result {
Ok((query_return, is_cache_hit)) => {
succeed_get_timer(
timer,
*is_cache_hit,
query_return.journal.end_cursor.is_some(),
);
},
Err(e) => {
timer.finish_with(e.metric_status_label_value());
},
}
Ok(result?.0)
}
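    // The caching loop: plan an operation under the cache lock, perform it
    // (possibly executing the UDF), validate the result at the requested
    // timestamp, and write it back. Any step may send us back to the top of the
    // loop until `TOTAL_QUERY_TIMEOUT` is exhausted.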
async fn _get(
&self,
request_id: RequestId,
path: PublicFunctionPath,
args: ConvexArray,
identity: Identity,
ts: Timestamp,
journal: Option<QueryJournal>,
caller: FunctionCaller,
usage_tracker: FunctionUsageTracker,
) -> anyhow::Result<(QueryReturn, bool)> {
let start = self.rt.monotonic_now();
let identity_cache_key = identity.cache_key();
let requested_key = RequestedCacheKey {
instance: self.instance_id,
path,
args,
identity: identity_cache_key,
journal: journal.unwrap_or_else(QueryJournal::new),
allowed_visibility: caller.allowed_visibility(),
};
let context = ExecutionContext::new(request_id, &caller);
// If the query exists at some cache key, but the cached entry is invalid,
// create a Waiting entry at that key, even if it's not the most precise for the
// request. e.g. if the query was cached with identity:None, create a
// Waiting entry with identity:None so other queries with other
// identities will wait for us to finish. This requires keeping
// `stored_key_hint` across iterations, since finding an invalid key
// removes it from the cache and continues the loop.
let mut stored_key_hint = None;
let mut num_attempts = 0;
'top: loop {
num_attempts += 1;
let now = self.rt.monotonic_now();
            // Bound the total time of the caching algorithm in case we wait too
            // long before we start executing. If there is a slowdown, we prefer to
            // fail fast instead of adding additional load to the system.
let elapsed = now - start;
anyhow::ensure!(
elapsed <= *TOTAL_QUERY_TIMEOUT,
"Query execution time out: {elapsed:?}",
);
// Step 1: Decide what we're going to do this iteration: use a cached value,
// wait on someone else to run a UDF, or run the UDF ourselves.
let maybe_op = self.cache.plan_cache_op(
&requested_key,
stored_key_hint.as_ref(),
start,
now,
&identity,
ts,
context.clone(),
);
let (op, stored_key) = match maybe_op {
Some(op_key) => op_key,
None => continue 'top,
};
stored_key_hint = Some(stored_key.clone());
            // Create a guard so that the waiting entry always gets cleaned up if the
            // current future returns an error or gets dropped.
let waiting_entry_id = match op {
CacheOp::Go {
waiting_entry_id, ..
} => waiting_entry_id,
_ => None,
};
let mut waiting_entry_guard =
WaitingEntryGuard::new(waiting_entry_id, &stored_key, self.cache.clone());
// Step 2: Perform our cache operation, potentially running the UDF.
let is_cache_hit = match op {
// Serving from cache.
CacheOp::Ready { .. } => true,
// We either use a result from the cache or we continue from 'top
// after Step 2 without logging.
CacheOp::Wait { .. } => true,
// We are executing ourselves.
CacheOp::Go { .. } => false,
};
let (result, table_stats) = match self
.perform_cache_op(&requested_key, &stored_key, op, usage_tracker.clone())
.await?
{
Some(r) => r,
None => continue 'top,
};
// Step 3: Validate that the cache result we got is good enough. Is our desired
// timestamp in its validity interval? If it looked at system time, is it not
// too old?
let cache_result = match self.validate_cache_result(&stored_key, ts, result).await? {
Some(r) => r,
None => continue 'top,
};
// Step 4: Rewrite the value into the cache. If this was a cache hit, this will
// bump the cache result's token. This method will discard the new value if the
// UDF failed or if a newer (i.e. higher `original_ts`) value is in the cache.
if cache_result.outcome.result.is_ok() {
// We do not cache JSErrors
let actual_stored_keys =
requested_key.cache_keys_after_execution(&cache_result.outcome);
waiting_entry_guard.complete(actual_stored_keys, cache_result.clone());
} else {
drop(waiting_entry_guard);
}
// Step 5: Log some stuff and return.
log_success(num_attempts);
let usage_stats = usage_tracker.clone().gather_user_stats();
let database_bandwidth_bytes = usage_stats.database_egress_size.values().sum();
log_query_bandwidth_bytes(
cache_result.outcome.journal.end_cursor.is_some(),
database_bandwidth_bytes,
);
self.udf_execution
.log_query(
&cache_result.outcome,
table_stats,
is_cache_hit,
start.elapsed(),
caller,
usage_tracker,
context.clone(),
)
.await;
let result = QueryReturn {
result: cache_result.outcome.result.clone(),
log_lines: cache_result.outcome.log_lines.clone(),
token: cache_result.token,
journal: cache_result.outcome.journal.clone(),
};
return Ok((result, is_cache_hit));
}
}
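    // Carry out the planned operation. Returns `Ok(None)` when the caller should
    // retry from the top of the loop: the peer we were waiting on went away, or we
    // ran out of time while waiting. For `CacheOp::Go`, this runs the UDF in a new
    // transaction, validates arguments and return values, and broadcasts a
    // successful result to any waiting peers.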
#[fastrace::trace]
async fn perform_cache_op(
&self,
requested_key: &RequestedCacheKey,
key: &StoredCacheKey,
op: CacheOp<'_>,
usage_tracker: FunctionUsageTracker,
) -> anyhow::Result<Option<(CacheResult, BTreeMap<TableName, TableStats>)>> {
let pause_client = self.rt.pause_client();
pause_client.wait("perform_cache_op").await;
let r = match op {
CacheOp::Ready { result } => {
if result.outcome.result.is_err() {
panic!("Developer error: Cache contained failed execution for {key:?}")
}
(result, BTreeMap::new())
},
CacheOp::Wait {
waiting_entry_id,
mut receiver,
remaining,
} => {
let result = select_biased! {
maybe_result = receiver.recv().fuse() => match maybe_result {
Err(..) => {
// The peer working on the cache entry went away (perhaps due to an
// error), so remove its entry and retry.
self.cache.remove_waiting(key, waiting_entry_id);
log_perform_wait_peer_timeout();
return Ok(None)
},
Ok(r) => r,
},
// We checked in `plan_cache_op` that the peer hadn't timed out with respect to
// its start time, so timing out here means that we're on a retry and ran out of
// our time ourselves. Therefore, don't remove the cache entry in this
// condition.
_ = self.rt.wait(remaining).fuse() => {
log_perform_wait_self_timeout();
return Ok(None)
},
};
if result.outcome.result.is_err() {
panic!("Developer error: CacheOp::Go sent failed execution for {key:?}")
}
(result, BTreeMap::new())
},
CacheOp::Go {
waiting_entry_id: _,
sender,
path,
args,
identity,
ts,
journal,
allowed_visibility,
context,
} => {
let mut tx = self
.database
.begin_with_ts(identity.clone(), ts, usage_tracker)
.await?;
                // We validate UDF visibility here, as opposed to earlier, so that the validation
                // checks are transactional with running the query. This is safe because we will
                // never serve a result based on a stale visibility check: the data read as part
                // of the visibility check is part of the ReadSet for this query.
let validate_result = ValidatedPathAndArgs::new_with_returns_validator(
allowed_visibility,
&mut tx,
path.clone(),
args.clone(),
UdfType::Query,
)
.await?;
let (mut tx, query_outcome) = match validate_result {
Err(js_err) => {
let query_outcome = UdfOutcome::from_error(
js_err,
path.clone().debug_into_component_path(),
args.clone(),
identity.clone().into(),
self.rt.clone(),
None,
)?;
(tx, query_outcome)
},
Ok((path_and_args, returns_validator)) => {
let component = path_and_args.path().component;
let (mut tx, outcome) = self
.function_router
.execute_query_or_mutation(
tx,
path_and_args,
UdfType::Query,
journal.clone(),
context,
)
.await?;
let FunctionOutcome::Query(mut query_outcome) = outcome else {
anyhow::bail!("Received non-query outcome when executing a query")
};
if let Ok(ref json_packed_value) = &query_outcome.result {
let output: ConvexValue = json_packed_value.unpack();
let table_mapping = tx.table_mapping().namespace(component.into());
let virtual_system_mapping = tx.virtual_system_mapping();
let returns_validation_error = returns_validator.check_output(
&output,
&table_mapping,
virtual_system_mapping,
);
if let Some(js_err) = returns_validation_error {
query_outcome.result = Err(js_err);
}
}
(tx, query_outcome)
},
};
let ts = tx.begin_timestamp();
let table_stats = tx.take_stats();
let token = tx.into_token()?;
let result = CacheResult {
outcome: Arc::new(query_outcome),
original_ts: *ts,
token,
};
if result.outcome.result.is_ok()
&& requested_key
.cache_keys_after_execution(&result.outcome)
.contains(key)
{
let _: Result<_, _> = sender.try_broadcast(result.clone());
} else {
                    // Dropping the sender closes the channel, so any waiting peers
                    // observe an error and retry.
drop(sender);
}
log_perform_go(result.outcome.result.is_ok());
(result, table_stats)
},
};
Ok(Some(r))
}
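    // Check that a cache result can be served at timestamp `ts`: the result must
    // not be newer than `ts`, its read-set token must refresh up to `ts`, and, if
    // the UDF observed system time, the entry must be younger than
    // `MAX_CACHE_AGE`. Returns `Ok(None)` (evicting the entry where appropriate)
    // when the caller should re-execute.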
#[fastrace::trace]
async fn validate_cache_result(
&self,
key: &StoredCacheKey,
ts: Timestamp,
mut result: CacheResult,
) -> anyhow::Result<Option<CacheResult>> {
if ts < result.original_ts {
// If the cached value is newer than the requested timestamp,
// we have to re-execute the UDF.
log_validate_ts_too_old();
return Ok(None);
}
result.token = match self.database.refresh_token(result.token, ts).await? {
Ok(t) => t,
Err(_invalid_ts) => {
tracing::debug!(
"Couldn't refresh cache entry from {} to {}, retrying...",
result.original_ts,
ts
);
self.cache.remove_ready(key, result.original_ts);
log_validate_refresh_failed();
return Ok(None);
},
};
if result.outcome.observed_time {
let sys_now = self.rt.unix_timestamp();
let cached_time = result.outcome.unix_timestamp;
match sys_now.checked_sub(cached_time) {
Some(entry_age) if entry_age > MAX_CACHE_AGE => {
tracing::debug!(
"Log entry for {:?} used system time and is too old ({:?}), retrying...",
key,
entry_age
);
self.cache.remove_ready(key, result.original_ts);
log_validate_system_time_too_old();
return Ok(None);
},
None => {
tracing::warn!(
"Cached value's timestamp {:?} is in the future (now: {:?})?",
cached_time,
sys_now,
);
self.cache.remove_ready(key, result.original_ts);
log_validate_system_time_in_the_future();
return Ok(None);
},
Some(..) => (),
}
}
Ok(Some(result))
}
}
// A wrapper struct that makes sure that the waiting entry always gets removed
// when the performing operation is dropped, even if the caller future gets
// canceled.
struct WaitingEntryGuard<'a> {
entry_id: Option<u64>,
key: &'a StoredCacheKey,
cache: QueryCache,
}
impl<'a> WaitingEntryGuard<'a> {
fn new(entry_id: Option<u64>, key: &'a StoredCacheKey, cache: QueryCache) -> Self {
Self {
entry_id,
key,
cache,
}
}
    // Removes the waiting entry and publishes the ready results, so there is
    // nothing left to clean up on Drop.
fn complete(&mut self, actual_stored_keys: SmallVec<[StoredCacheKey; 2]>, result: CacheResult) {
if let Some(entry_id) = self.entry_id.take() {
self.cache.remove_waiting(self.key, entry_id);
self.cache.put_ready(actual_stored_keys, result);
}
}
}
impl Drop for WaitingEntryGuard<'_> {
fn drop(&mut self) {
// Remove the cache entry from the cache if still present.
if let Some(entry_id) = self.entry_id {
self.cache.remove_waiting(self.key, entry_id)
}
}
}
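// Mutex-guarded cache state: the LRU map itself, its approximate total size in
// bytes, the global size limit, and a counter for allocating waiting-entry ids.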
struct Inner {
cache: LruCache<StoredCacheKey, CacheEntry>,
size: usize,
size_limit: usize,
next_waiting_id: u64,
}
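/// A shared, size-bounded LRU cache of query results. Cloning is cheap and all
/// clones share the same underlying state.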
#[derive(Clone)]
pub struct QueryCache {
inner: Arc<Mutex<Inner>>,
}
impl QueryCache {
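    /// Create a cache whose total in-memory footprint (keys plus entries) is
    /// bounded by approximately `size_limit` bytes.
    ///
    /// A minimal usage sketch (the size here is illustrative; clones share one
    /// underlying cache):
    ///
    /// ```ignore
    /// let cache = QueryCache::new(64 << 20); // ~64 MiB of cached query results
    /// let cache_manager =
    ///     CacheManager::new(rt, database, function_router, udf_execution, cache.clone());
    /// ```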
pub fn new(size_limit: usize) -> Self {
let inner = Inner {
cache: LruCache::unbounded(),
size: 0,
next_waiting_id: 0,
size_limit,
};
Self {
inner: Arc::new(Mutex::new(inner)),
}
}
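    // Step 1 of the loop: under the cache lock, decide whether to serve a ready
    // result, wait on a peer's in-flight execution, or execute the UDF ourselves
    // (registering a `Waiting` entry for others to join when appropriate).
    // Returns `None` if the caller should retry from the top of the loop.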
fn plan_cache_op<'a>(
&self,
key: &'a RequestedCacheKey,
stored_key_hint: Option<&'_ StoredCacheKey>,
start: tokio::time::Instant,
now: tokio::time::Instant,
identity: &'a Identity,
ts: Timestamp,
context: ExecutionContext,
) -> Option<(CacheOp<'a>, StoredCacheKey)> {
let go = |sender: Option<(Sender<_>, u64)>| {
let (sender, waiting_entry_id) = match sender {
Some((sender, waiting_entry_id)) => (sender, Some(waiting_entry_id)),
None => {
// No one should wait for this, so it's okay to drop the
// receiver. And the sender ignores errors.
let (sender, _) = broadcast(1);
(sender, None)
},
};
CacheOp::Go {
waiting_entry_id,
sender,
path: &key.path,
args: &key.args,
identity,
ts,
journal: &key.journal,
allowed_visibility: key.allowed_visibility,
context,
}
};
let mut inner = self.inner.lock();
let (entry, stored_key) = key.get_cache_entry(&mut inner.cache, stored_key_hint);
let op = match entry {
Some(CacheEntry::Ready(r)) => {
if ts < r.original_ts {
// If another request has already executed this UDF at a
// newer timestamp, we can't use the cache. Re-execute
// in this case.
tracing::debug!("Cache value too new for {:?}", stored_key);
log_plan_go(GoReason::PeerTimestampTooNew);
go(None)
} else {
tracing::debug!("Cache value ready for {:?}", stored_key);
log_plan_ready();
CacheOp::Ready { result: r.clone() }
}
},
Some(CacheEntry::Waiting {
id,
started: peer_started,
receiver,
ts: peer_ts,
}) => {
let entry_id = *id;
if *peer_ts > ts {
log_plan_go(GoReason::PeerTimestampTooNew);
return Some((go(None), stored_key));
}
// We don't serialize sampling `now` under the cache lock, and since it can
// occur on different threads, we're not guaranteed that
// `peer_started < now`. So, if the peer started *after* us,
// consider its `peer_elapsed` time to be zero.
let peer_started = cmp::min(now, *peer_started);
let peer_elapsed = now - peer_started;
if peer_elapsed >= *TOTAL_QUERY_TIMEOUT {
tracing::debug!(
"Peer timed out ({:?}), removing cache entry and retrying",
peer_elapsed
);
inner.remove_waiting(&stored_key, entry_id);
log_plan_peer_timeout();
return None;
}
let get_elapsed = now - start;
let remaining = *TOTAL_QUERY_TIMEOUT - cmp::max(peer_elapsed, get_elapsed);
tracing::debug!("Waiting for peer to compute {:?}", stored_key);
log_plan_wait();
CacheOp::Wait {
waiting_entry_id: *id,
receiver: receiver.clone(),
remaining,
}
},
None => {
tracing::debug!("No cache value for {:?}, executing UDF...", stored_key);
let (sender, executor_id) = inner.put_waiting(stored_key.clone(), now, ts);
log_plan_go(GoReason::NoCacheResult);
go(Some((sender, executor_id)))
},
};
Some((op, stored_key))
}
fn remove_waiting(&self, key: &StoredCacheKey, entry_id: u64) {
self.inner.lock().remove_waiting(key, entry_id)
}
fn remove_ready(&self, key: &StoredCacheKey, original_ts: Timestamp) {
self.inner.lock().remove_ready(key, original_ts)
}
fn put_ready(&self, keys: SmallVec<[StoredCacheKey; 2]>, result: CacheResult) {
let mut inner = self.inner.lock();
for (result, key) in iter::repeat_n(result, keys.len()).zip(keys) {
inner.put_ready(key, result);
}
}
}
impl Inner {
    // Remove only a `CacheEntry::Waiting` from the cache, predicated on its
    // `id` matching `entry_id`.
fn remove_waiting(&mut self, key: &StoredCacheKey, entry_id: u64) {
match self.cache.get(key) {
Some(CacheEntry::Waiting { id, .. }) if *id == entry_id => {
let (actual_key, entry) = self.cache.pop_entry(key).unwrap();
self.size -= actual_key.size() + entry.size();
},
_ => (),
}
log_cache_size(self.size)
}
// Remove only a `CacheEntry::Ready` from the cache, predicated on its
// `original_ts` matching.
fn remove_ready(&mut self, key: &StoredCacheKey, original_ts: Timestamp) {
match self.cache.get(key) {
Some(CacheEntry::Ready(ref result)) if result.original_ts == original_ts => {
let (actual_key, entry) = self.cache.pop_entry(key).unwrap();
self.size -= actual_key.size() + entry.size();
},
_ => (),
}
log_cache_size(self.size);
}
fn put_waiting(
&mut self,
key: StoredCacheKey,
now: tokio::time::Instant,
ts: Timestamp,
) -> (Sender<CacheResult>, u64) {
let id = self.next_waiting_id;
self.next_waiting_id += 1;
let (sender, receiver) = broadcast(1);
let new_entry = CacheEntry::Waiting {
id,
receiver,
started: now,
ts,
};
let new_size = key.size() + new_entry.size();
let old_size = self
.cache
.push(key, new_entry)
.map(|(old_key, old_value)| old_key.size() + old_value.size())
.unwrap_or(0);
// N.B.: `self.size - old_size` could be _negative_ if `key.size()` was larger
// than the size of the preexisting key; therefore add before subtracting
self.size = self.size + new_size - old_size;
self.enforce_size_limit();
(sender, id)
}
    // Put a `CacheEntry::Ready` into the cache, dropping the new value if an existing
    // entry is at least as new (a higher `original_ts`, or the same `original_ts` with
    // a token that is at least as fresh).
fn put_ready(&mut self, key: StoredCacheKey, result: CacheResult) {
match self.cache.get_mut(&key) {
Some(entry @ CacheEntry::Waiting { .. }) => {
let new_entry = CacheEntry::Ready(result);
self.size -= entry.size();
self.size += new_entry.size();
*entry = new_entry;
},
Some(CacheEntry::Ready(ref mut existing_result)) => {
if existing_result.original_ts < result.original_ts
|| (existing_result.original_ts == result.original_ts
&& existing_result.token.ts() < result.token.ts())
{
self.size -= existing_result.heap_size();
self.size += result.heap_size();
*existing_result = result;
} else {
tracing::debug!(
"dropping cache result for {key:?} because result timestamp {} <= cached \
timestamp {}",
result.original_ts,
existing_result.original_ts
);
log_drop_cache_result_too_old();
}
},
None => {
let new_entry = CacheEntry::Ready(result);
self.size += key.size() + new_entry.size();
self.cache.put(key, new_entry);
},
}
self.enforce_size_limit();
}
    /// Pop LRU entries until the cache is under its size limit.
fn enforce_size_limit(&mut self) {
while self.size > self.size_limit {
let (popped_key, popped_entry) = self
.cache
.pop_lru()
.expect("Cache is too large without any items?");
self.size -= popped_key.size() + popped_entry.size();
if let CacheEntry::Ready(r) = popped_entry {
let system_time: SystemTime = r.token.ts().into();
if let Ok(t) = system_time.elapsed() {
query_cache_log_eviction(t);
}
}
}
log_cache_size(self.size)
}
}
enum CacheOp<'a> {
Ready {
result: CacheResult,
},
Wait {
waiting_entry_id: u64,
receiver: Receiver<CacheResult>,
remaining: Duration,
},
Go {
waiting_entry_id: Option<u64>,
sender: Sender<CacheResult>,
path: &'a PublicFunctionPath,
args: &'a ConvexArray,
identity: &'a Identity,
ts: Timestamp,
journal: &'a QueryJournal,
allowed_visibility: AllowedVisibility,
context: ExecutionContext,
},
}
#[cfg(test)]
mod tests {
use std::{
path::PathBuf,
sync::Arc,
};
use common::{
components::{
ExportPath,
PublicFunctionPath,
},
identity::IdentityCacheKey,
index::IndexKeyBytes,
query::{
Cursor,
CursorPosition,
},
query_journal::QueryJournal,
types::AllowedVisibility,
};
use database::Token;
use proptest::{
prelude::{
Arbitrary,
Strategy,
},
strategy::ValueTree,
test_runner::TestRunner,
};
use smallvec::smallvec;
use sync_types::{
CanonicalizedModulePath,
CanonicalizedUdfPath,
Timestamp,
};
use tokio::time::Instant;
use udf::UdfOutcome;
use value::{
ConvexArray,
ConvexValue,
};
use super::{
CacheResult,
InstanceId,
QueryCache,
StoredCacheKey,
};
// Construct a cache key where as many fields as possible have extra capacity in
// them
fn make_cache_key() -> StoredCacheKey {
macro_rules! with_extra_capacity {
($e:expr) => {{
let mut r = $e;
r.reserve(100);
r
}};
}
StoredCacheKey {
instance: InstanceId(0),
path: PublicFunctionPath::RootExport(ExportPath::from(CanonicalizedUdfPath::new(
CanonicalizedModulePath::new(
PathBuf::with_capacity(1 << 10),
false,
false,
false,
false,
),
"function_name".parse().unwrap(),
))),
args: ConvexArray::try_from(with_extra_capacity!(vec![ConvexValue::from(100.)]))
.unwrap(),
identity: Some(IdentityCacheKey::InstanceAdmin(with_extra_capacity!(
"admin".to_string()
))),
journal: QueryJournal {
end_cursor: Some(Cursor {
position: CursorPosition::After(IndexKeyBytes(with_extra_capacity!(
b"key".to_vec()
))),
query_fingerprint: with_extra_capacity!(b"fingerprint".to_vec()),
}),
},
allowed_visibility: AllowedVisibility::All,
}
}
fn make_cache_result() -> CacheResult {
let mut test_runner = TestRunner::deterministic();
CacheResult {
outcome: Arc::new(
UdfOutcome::arbitrary()
.new_tree(&mut test_runner)
.unwrap()
.current(),
),
original_ts: Timestamp::MIN,
token: Token::arbitrary()
.new_tree(&mut test_runner)
.unwrap()
.current(),
}
}
#[test]
fn test_put_waiting_excess_capacity() {
let cache = QueryCache::new(usize::MAX);
let cache_key = make_cache_key();
// Cloning the key effectively shrinks away the excess capacity
let cloned_key = cache_key.clone();
assert_ne!(cache_key.size(), cloned_key.size());
let (_, id) = cache
.inner
.lock()
.put_waiting(cloned_key, Instant::now(), Timestamp::MIN);
assert!(cache.inner.lock().size > 0);
cache.remove_waiting(&cache_key, id);
assert_eq!(cache.inner.lock().size, 0);
}
#[test]
fn test_put_ready_excess_capacity() {
let cache = QueryCache::new(usize::MAX);
let cache_key = make_cache_key();
let cloned_key = cache_key.clone();
assert_ne!(cache_key.size(), cloned_key.size());
cache.put_ready(smallvec![cloned_key], make_cache_result());
assert!(cache.inner.lock().size > 0);
cache.remove_ready(&cache_key, Timestamp::MIN);
assert_eq!(cache.inner.lock().size, 0);
}
}