use std::any::{Any, TypeId};
use std::sync::Arc;
use deepsize::{Context, DeepSizeOf};
use futures::Future;
use moka::sync::Cache;
use object_store::path::Path;
use crate::utils::path::LancePathExt;
use crate::Result;
/// Shared pointer to a `Send + Sync` value whose concrete type has been erased
/// behind `dyn Any`; the concrete type is recovered later by downcasting.
type ArcAny = Arc<dyn Any + Send + Sync>;
/// A type-erased cache value bundled with a function that can measure it.
///
/// Once a value is stored as `ArcAny` its concrete type is no longer known, so
/// the measuring function is captured at construction time, while the type is
/// still available.
#[derive(Clone)]
struct SizedRecord {
/// The cached value, with its concrete type erased.
record: ArcAny,
/// Computes the size of `record`; invoked as `(size_accessor)(&record)`.
size_accessor: Arc<dyn Fn(&ArcAny) -> usize + Send + Sync>,
}
impl std::fmt::Debug for SizedRecord {
    /// Formats the record as a struct named `SizedRecord` that shows only the
    /// `record` field; `size_accessor` is a `dyn Fn` and is left out.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let mut builder = f.debug_struct("SizedRecord");
        builder.field("record", &self.record);
        builder.finish()
    }
}
impl SizedRecord {
    /// Wraps `record` in a type-erased container while remembering how to
    /// measure it.
    ///
    /// The stored accessor downcasts the erased pointer back to `T` and returns
    /// its `deep_size_of()`. It panics if handed a pointer that does not hold a
    /// `T`.
    fn new<T: DeepSizeOf + Send + Sync + 'static>(record: Arc<T>) -> Self {
        /// Recovers the concrete `U` behind the erased pointer and measures it.
        fn measure<U: DeepSizeOf + 'static>(erased: &ArcAny) -> usize {
            erased.downcast_ref::<U>().unwrap().deep_size_of()
        }

        Self {
            size_accessor: Arc::new(measure::<T>),
            record,
        }
    }
}
/// Cache of type-erased metadata records keyed by `(Path, TypeId)`.
///
/// The underlying cache is held in an `Arc`, so clones of this struct refer to
/// the same set of entries.
#[derive(Clone, Debug)]
pub struct FileMetadataCache {
/// Backing store; `None` means caching is disabled.
cache: Option<Arc<Cache<(Path, TypeId), SizedRecord>>>,
/// Optional prefix combined with caller-supplied paths (via `child_path`)
/// before they are used as cache keys.
base_path: Option<Path>,
}
impl DeepSizeOf for FileMetadataCache {
    /// Adds up the size reported by every cached record's size accessor.
    ///
    /// Keys are not included in the total. Returns 0 when caching is disabled.
    fn deep_size_of_children(&self, _: &mut Context) -> usize {
        let Some(cache) = self.cache.as_ref() else {
            return 0;
        };

        let mut total: usize = 0;
        for (_, entry) in cache.iter() {
            total += (entry.size_accessor)(&entry.record);
        }
        total
    }
}
/// Selects how `FileMetadataCache::with_capacity` builds the underlying cache.
pub enum CapacityMode {
/// Build the cache with `Cache::new(capacity)`, with no weigher installed.
Items,
/// Build the cache with a weigher that reports each record's deep size.
Bytes,
}
impl FileMetadataCache {
    /// Creates a cache whose capacity is counted in entries.
    ///
    /// `capacity` is passed to moka as the maximum capacity. No weigher is
    /// installed, so each entry counts as one unit.
    pub fn new(capacity: usize) -> Self {
        Self {
            cache: Some(Arc::new(Cache::new(capacity as u64))),
            base_path: None,
        }
    }

    /// Creates a handle with caching disabled.
    ///
    /// On such a handle `get` always returns `None`, `insert` does nothing and
    /// `size` reports 0.
    pub fn no_cache() -> Self {
        Self {
            cache: None,
            base_path: None,
        }
    }

    /// Creates a cache whose `capacity` is interpreted according to `mode`.
    ///
    /// * `CapacityMode::Items` - same as [`FileMetadataCache::new`].
    /// * `CapacityMode::Bytes` - `capacity` bounds the total weight of the
    ///   cache, where each entry weighs its deep size in bytes.
    pub fn with_capacity(capacity: usize, mode: CapacityMode) -> Self {
        match mode {
            CapacityMode::Items => Self::new(capacity),
            CapacityMode::Bytes => Self {
                cache: Some(Arc::new(
                    Cache::builder()
                        // The weigher only has an effect when a maximum
                        // capacity is set; without this call the requested
                        // capacity is ignored and the cache is unbounded.
                        .max_capacity(capacity as u64)
                        .weigher(|_, v: &SizedRecord| {
                            // moka weights are `u32`; saturate for records
                            // whose size does not fit.
                            (v.size_accessor)(&v.record).try_into().unwrap_or(u32::MAX)
                        })
                        .build(),
                )),
                base_path: None,
            },
        }
    }

    /// Returns a handle that shares this cache's entries but combines every
    /// path with `base_path` (via `child_path`) before using it as a key.
    ///
    /// Any base path already set on `self` is replaced, not extended.
    pub fn with_base_path(&self, base_path: Path) -> Self {
        Self {
            cache: self.cache.clone(),
            base_path: Some(base_path),
        }
    }

    /// Returns the number of entries currently cached (not their byte size).
    ///
    /// Pending cache maintenance is run first so the count is up to date.
    /// Returns 0 when caching is disabled.
    pub fn size(&self) -> usize {
        if let Some(cache) = self.cache.as_ref() {
            cache.run_pending_tasks();
            cache.entry_count() as usize
        } else {
            0
        }
    }

    /// Looks up the record of type `T` stored for `path`.
    ///
    /// Entries are keyed by both path and type, so a value inserted as one
    /// type is not visible when queried as another. Returns `None` on a miss
    /// or when caching is disabled.
    pub fn get<T: Send + Sync + 'static>(&self, path: &Path) -> Option<Arc<T>> {
        let cache = self.cache.as_ref()?;
        // Build the owned key path once, prefixed when a base path is set.
        let key_path = match &self.base_path {
            Some(base_path) => base_path.child_path(path),
            None => path.clone(),
        };
        cache.get(&(key_path, TypeId::of::<T>())).map(|entry| {
            entry
                .record
                .downcast::<T>()
                .expect("entries are keyed by TypeId, so the stored record must be a T")
        })
    }

    /// Stores `metadata` under `path` for type `T`.
    ///
    /// Does nothing when caching is disabled.
    pub fn insert<T: DeepSizeOf + Send + Sync + 'static>(&self, path: Path, metadata: Arc<T>) {
        let Some(cache) = self.cache.as_ref() else {
            return;
        };
        let path = if let Some(base_path) = &self.base_path {
            base_path.child_path(&path)
        } else {
            path
        };
        cache.insert((path, TypeId::of::<T>()), SizedRecord::new(metadata));
    }

    /// Returns the cached `T` for `path`, loading and caching it on a miss.
    ///
    /// `loader` receives `path` exactly as passed by the caller (without the
    /// base path applied).
    ///
    /// The lookup and the insert are separate steps, so callers that miss at
    /// the same time may each run `loader`.
    ///
    /// # Errors
    ///
    /// Propagates any error returned by `loader`; nothing is cached in that
    /// case.
    pub async fn get_or_insert<T: DeepSizeOf + Send + Sync + 'static, F, Fut>(
        &self,
        path: &Path,
        loader: F,
    ) -> Result<Arc<T>>
    where
        F: Fn(&Path) -> Fut,
        Fut: Future<Output = Result<T>>,
    {
        if let Some(metadata) = self.get::<T>(path) {
            return Ok(metadata);
        }
        let metadata = Arc::new(loader(path).await?);
        self.insert(path.to_owned(), metadata.clone());
        Ok(metadata)
    }
}