mirror of
https://github.com/meilisearch/MeiliSearch
synced 2025-01-20 18:27:28 +01:00
Fix geosort bug
This commit is contained in:
parent
65e49b7092
commit
11e2a2c1aa
@ -107,12 +107,16 @@ impl<Q: RankingRuleQueryTrait> GeoSort<Q> {
|
|||||||
|
|
||||||
/// Refill the internal buffer of cached docids based on the strategy.
|
/// Refill the internal buffer of cached docids based on the strategy.
|
||||||
/// Drop the rtree if we don't need it anymore.
|
/// Drop the rtree if we don't need it anymore.
|
||||||
fn fill_buffer(&mut self, ctx: &mut SearchContext) -> Result<()> {
|
fn fill_buffer(
|
||||||
|
&mut self,
|
||||||
|
ctx: &mut SearchContext,
|
||||||
|
geo_candidates: &RoaringBitmap,
|
||||||
|
) -> Result<()> {
|
||||||
debug_assert!(self.field_ids.is_some(), "fill_buffer can't be called without the lat&lng");
|
debug_assert!(self.field_ids.is_some(), "fill_buffer can't be called without the lat&lng");
|
||||||
debug_assert!(self.cached_sorted_docids.is_empty());
|
debug_assert!(self.cached_sorted_docids.is_empty());
|
||||||
|
|
||||||
// lazily initialize the rtree if needed by the strategy, and cache it in `self.rtree`
|
// lazily initialize the rtree if needed by the strategy, and cache it in `self.rtree`
|
||||||
let rtree = if self.strategy.use_rtree(self.geo_candidates.len() as usize) {
|
let rtree = if self.strategy.use_rtree(geo_candidates.len() as usize) {
|
||||||
if let Some(rtree) = self.rtree.as_ref() {
|
if let Some(rtree) = self.rtree.as_ref() {
|
||||||
// get rtree from cache
|
// get rtree from cache
|
||||||
Some(rtree)
|
Some(rtree)
|
||||||
@ -131,7 +135,7 @@ impl<Q: RankingRuleQueryTrait> GeoSort<Q> {
|
|||||||
if self.ascending {
|
if self.ascending {
|
||||||
let point = lat_lng_to_xyz(&self.point);
|
let point = lat_lng_to_xyz(&self.point);
|
||||||
for point in rtree.nearest_neighbor_iter(&point) {
|
for point in rtree.nearest_neighbor_iter(&point) {
|
||||||
if self.geo_candidates.contains(point.data.0) {
|
if geo_candidates.contains(point.data.0) {
|
||||||
self.cached_sorted_docids.push_back(point.data);
|
self.cached_sorted_docids.push_back(point.data);
|
||||||
if self.cached_sorted_docids.len() >= cache_size {
|
if self.cached_sorted_docids.len() >= cache_size {
|
||||||
break;
|
break;
|
||||||
@ -143,7 +147,7 @@ impl<Q: RankingRuleQueryTrait> GeoSort<Q> {
|
|||||||
// and we insert the points in reverse order they get reversed when emptying the cache later on
|
// and we insert the points in reverse order they get reversed when emptying the cache later on
|
||||||
let point = lat_lng_to_xyz(&opposite_of(self.point));
|
let point = lat_lng_to_xyz(&opposite_of(self.point));
|
||||||
for point in rtree.nearest_neighbor_iter(&point) {
|
for point in rtree.nearest_neighbor_iter(&point) {
|
||||||
if self.geo_candidates.contains(point.data.0) {
|
if geo_candidates.contains(point.data.0) {
|
||||||
self.cached_sorted_docids.push_front(point.data);
|
self.cached_sorted_docids.push_front(point.data);
|
||||||
if self.cached_sorted_docids.len() >= cache_size {
|
if self.cached_sorted_docids.len() >= cache_size {
|
||||||
break;
|
break;
|
||||||
@ -155,8 +159,7 @@ impl<Q: RankingRuleQueryTrait> GeoSort<Q> {
|
|||||||
// the iterative version
|
// the iterative version
|
||||||
let [lat, lng] = self.field_ids.unwrap();
|
let [lat, lng] = self.field_ids.unwrap();
|
||||||
|
|
||||||
let mut documents = self
|
let mut documents = geo_candidates
|
||||||
.geo_candidates
|
|
||||||
.iter()
|
.iter()
|
||||||
.map(|id| -> Result<_> { Ok((id, geo_value(id, lat, lng, ctx.index, ctx.txn)?)) })
|
.map(|id| -> Result<_> { Ok((id, geo_value(id, lat, lng, ctx.index, ctx.txn)?)) })
|
||||||
.collect::<Result<Vec<(u32, [f64; 2])>>>()?;
|
.collect::<Result<Vec<(u32, [f64; 2])>>>()?;
|
||||||
@ -216,9 +219,10 @@ impl<'ctx, Q: RankingRuleQueryTrait> RankingRule<'ctx, Q> for GeoSort<Q> {
|
|||||||
assert!(self.query.is_none());
|
assert!(self.query.is_none());
|
||||||
|
|
||||||
self.query = Some(query.clone());
|
self.query = Some(query.clone());
|
||||||
self.geo_candidates &= universe;
|
|
||||||
|
|
||||||
if self.geo_candidates.is_empty() {
|
let geo_candidates = &self.geo_candidates & universe;
|
||||||
|
|
||||||
|
if geo_candidates.is_empty() {
|
||||||
return Ok(());
|
return Ok(());
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -226,7 +230,7 @@ impl<'ctx, Q: RankingRuleQueryTrait> RankingRule<'ctx, Q> for GeoSort<Q> {
|
|||||||
let lat = fid_map.id("_geo.lat").expect("geo candidates but no fid for lat");
|
let lat = fid_map.id("_geo.lat").expect("geo candidates but no fid for lat");
|
||||||
let lng = fid_map.id("_geo.lng").expect("geo candidates but no fid for lng");
|
let lng = fid_map.id("_geo.lng").expect("geo candidates but no fid for lng");
|
||||||
self.field_ids = Some([lat, lng]);
|
self.field_ids = Some([lat, lng]);
|
||||||
self.fill_buffer(ctx)?;
|
self.fill_buffer(ctx, &geo_candidates)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -238,9 +242,10 @@ impl<'ctx, Q: RankingRuleQueryTrait> RankingRule<'ctx, Q> for GeoSort<Q> {
|
|||||||
universe: &RoaringBitmap,
|
universe: &RoaringBitmap,
|
||||||
) -> Result<Option<RankingRuleOutput<Q>>> {
|
) -> Result<Option<RankingRuleOutput<Q>>> {
|
||||||
let query = self.query.as_ref().unwrap().clone();
|
let query = self.query.as_ref().unwrap().clone();
|
||||||
self.geo_candidates &= universe;
|
|
||||||
|
|
||||||
if self.geo_candidates.is_empty() {
|
let geo_candidates = &self.geo_candidates & universe;
|
||||||
|
|
||||||
|
if geo_candidates.is_empty() {
|
||||||
return Ok(Some(RankingRuleOutput {
|
return Ok(Some(RankingRuleOutput {
|
||||||
query,
|
query,
|
||||||
candidates: universe.clone(),
|
candidates: universe.clone(),
|
||||||
@ -261,7 +266,7 @@ impl<'ctx, Q: RankingRuleQueryTrait> RankingRule<'ctx, Q> for GeoSort<Q> {
|
|||||||
}
|
}
|
||||||
};
|
};
|
||||||
while let Some((id, point)) = next(&mut self.cached_sorted_docids) {
|
while let Some((id, point)) = next(&mut self.cached_sorted_docids) {
|
||||||
if self.geo_candidates.contains(id) {
|
if geo_candidates.contains(id) {
|
||||||
return Ok(Some(RankingRuleOutput {
|
return Ok(Some(RankingRuleOutput {
|
||||||
query,
|
query,
|
||||||
candidates: RoaringBitmap::from_iter([id]),
|
candidates: RoaringBitmap::from_iter([id]),
|
||||||
@ -276,7 +281,7 @@ impl<'ctx, Q: RankingRuleQueryTrait> RankingRule<'ctx, Q> for GeoSort<Q> {
|
|||||||
|
|
||||||
// if we got out of this loop it means we've exhausted our cache.
|
// if we got out of this loop it means we've exhausted our cache.
|
||||||
// we need to refill it and run the function again.
|
// we need to refill it and run the function again.
|
||||||
self.fill_buffer(ctx)?;
|
self.fill_buffer(ctx, &geo_candidates)?;
|
||||||
self.next_bucket(ctx, logger, universe)
|
self.next_bucket(ctx, logger, universe)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user