mirror of
https://github.com/meilisearch/MeiliSearch
synced 2024-11-23 05:14:27 +01:00
Introduce cache structures used with ranking rule graphs
This commit is contained in:
parent
864f6410ed
commit
23bf572dea
55
milli/src/search/new/ranking_rule_graph/edge_docids_cache.rs
Normal file
55
milli/src/search/new/ranking_rule_graph/edge_docids_cache.rs
Normal file
@ -0,0 +1,55 @@
|
|||||||
|
use std::collections::HashMap;
|
||||||
|
use std::marker::PhantomData;
|
||||||
|
|
||||||
|
use heed::RoTxn;
|
||||||
|
use roaring::RoaringBitmap;
|
||||||
|
|
||||||
|
use super::{EdgeDetails, EdgeIndex, RankingRuleGraph, RankingRuleGraphTrait};
|
||||||
|
use crate::new::db_cache::DatabaseCache;
|
||||||
|
use crate::new::BitmapOrAllRef;
|
||||||
|
use crate::{Index, Result};
|
||||||
|
|
||||||
|
pub struct EdgeDocidsCache<G: RankingRuleGraphTrait> {
|
||||||
|
pub cache: HashMap<EdgeIndex, RoaringBitmap>,
|
||||||
|
|
||||||
|
// TODO: There is a big difference between `cache`, which is always valid, and
|
||||||
|
// `empty_path_prefixes`, which is only accurate for a particular universe
|
||||||
|
// ALSO, we should have a universe-specific `empty_edge` to use
|
||||||
|
// pub empty_path_prefixes: HashSet<Vec<EdgeIndex>>,
|
||||||
|
_phantom: PhantomData<G>,
|
||||||
|
}
|
||||||
|
impl<G: RankingRuleGraphTrait> Default for EdgeDocidsCache<G> {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self {
|
||||||
|
cache: Default::default(),
|
||||||
|
// empty_path_prefixes: Default::default(),
|
||||||
|
_phantom: Default::default(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
impl<G: RankingRuleGraphTrait> EdgeDocidsCache<G> {
|
||||||
|
pub fn get_edge_docids<'s, 'transaction>(
|
||||||
|
&'s mut self,
|
||||||
|
index: &Index,
|
||||||
|
txn: &'transaction RoTxn,
|
||||||
|
db_cache: &mut DatabaseCache<'transaction>,
|
||||||
|
edge_index: &EdgeIndex,
|
||||||
|
graph: &RankingRuleGraph<G>,
|
||||||
|
) -> Result<BitmapOrAllRef<'s>> {
|
||||||
|
if self.cache.contains_key(edge_index) {
|
||||||
|
return Ok(BitmapOrAllRef::Bitmap(&self.cache[edge_index]));
|
||||||
|
}
|
||||||
|
let edge = graph.get_edge(*edge_index).as_ref().unwrap();
|
||||||
|
|
||||||
|
match &edge.details {
|
||||||
|
EdgeDetails::Unconditional => Ok(BitmapOrAllRef::All),
|
||||||
|
EdgeDetails::Data(details) => {
|
||||||
|
let docids = G::compute_docids(index, txn, db_cache, details)?;
|
||||||
|
|
||||||
|
let _ = self.cache.insert(*edge_index, docids);
|
||||||
|
let docids = &self.cache[edge_index];
|
||||||
|
Ok(BitmapOrAllRef::Bitmap(docids))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
23
milli/src/search/new/ranking_rule_graph/empty_paths_cache.rs
Normal file
23
milli/src/search/new/ranking_rule_graph/empty_paths_cache.rs
Normal file
@ -0,0 +1,23 @@
|
|||||||
|
use std::collections::HashSet;
|
||||||
|
|
||||||
|
use super::{paths_map::PathsMap, EdgeIndex};
|
||||||
|
|
||||||
|
#[derive(Default)]
|
||||||
|
pub struct EmptyPathsCache {
|
||||||
|
pub empty_edges: HashSet<EdgeIndex>,
|
||||||
|
pub empty_prefixes: PathsMap<()>,
|
||||||
|
}
|
||||||
|
impl EmptyPathsCache {
|
||||||
|
pub fn path_is_empty(&self, path: &[EdgeIndex]) -> bool {
|
||||||
|
for edge in path {
|
||||||
|
// TODO: should be a bitmap intersection
|
||||||
|
if self.empty_edges.contains(edge) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if self.empty_prefixes.contains_prefix_of_path(path) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
false
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user