From 60ddd534390e5a80f4fde0b2dc1de542dc57eeda Mon Sep 17 00:00:00 2001
From: Kerollmops
Date: Mon, 12 Jun 2023 11:39:31 +0200
Subject: [PATCH] Return one of the original facet values when doing a facet search

---
 milli/src/search/mod.rs | 36 ++++++++++++++++++++++++++++++------
 1 file changed, 30 insertions(+), 6 deletions(-)

diff --git a/milli/src/search/mod.rs b/milli/src/search/mod.rs
index 1590fac41..e05562f8e 100644
--- a/milli/src/search/mod.rs
+++ b/milli/src/search/mod.rs
@@ -14,8 +14,8 @@ use crate::error::UserError;
 use crate::heed_codec::facet::{FacetGroupKey, FacetGroupValue};
 use crate::score_details::{ScoreDetails, ScoringStrategy};
 use crate::{
-    execute_search, normalize_facet, AscDesc, DefaultSearchLogger, DocumentId, Index, Result,
-    SearchContext, BEU16,
+    execute_search, normalize_facet, AscDesc, DefaultSearchLogger, DocumentId, FieldId, Index,
+    Result, SearchContext, BEU16,
 };
 
 // Building these factories is not free.
@@ -259,6 +259,18 @@ impl<'a> SearchForFacetValues<'a> {
         self
     }
 
+    fn one_original_value_of(
+        &self,
+        field_id: FieldId,
+        facet_str: &str,
+        any_docid: DocumentId,
+    ) -> Result<Option<String>> {
+        let index = self.search_query.index;
+        let rtxn = self.search_query.rtxn;
+        let key: (FieldId, _, &str) = (field_id, any_docid, facet_str);
+        Ok(index.field_id_docid_facet_strings.get(rtxn, &key)?.map(|v| v.to_owned()))
+    }
+
     pub fn execute(&self) -> Result<Vec<FacetValueHit>> {
         let index = self.search_query.index;
         let rtxn = self.search_query.rtxn;
@@ -306,7 +318,10 @@ impl<'a> SearchForFacetValues<'a> {
                         {
                             let count = search_candidates.intersection_len(&bitmap);
                             if count != 0 {
-                                results.push(FacetValueHit { value: query.to_string(), count });
+                                let value = self
+                                    .one_original_value_of(fid, query, bitmap.min().unwrap())?
+                                    .unwrap_or_else(|| query.to_string());
+                                results.push(FacetValueHit { value, count });
                             }
                         }
                     } else {
@@ -338,7 +353,10 @@ impl<'a> SearchForFacetValues<'a> {
                             };
                             let count = search_candidates.intersection_len(&docids);
                             if count != 0 {
-                                results.push(FacetValueHit { value: value.to_string(), count });
+                                let value = self
+                                    .one_original_value_of(fid, value, docids.min().unwrap())?
+                                    .unwrap_or_else(|| query.to_string());
+                                results.push(FacetValueHit { value, count });
                                 length += 1;
                             }
                             if length >= MAX_NUMBER_OF_FACETS {
@@ -367,7 +385,10 @@ impl<'a> SearchForFacetValues<'a> {
                         };
                         let count = search_candidates.intersection_len(&docids);
                         if count != 0 {
-                            results.push(FacetValueHit { value: value.to_string(), count });
+                            let value = self
+                                .one_original_value_of(fid, value, docids.min().unwrap())?
+                                .unwrap_or_else(|| query.to_string());
+                            results.push(FacetValueHit { value, count });
                             length += 1;
                         }
                         if length >= MAX_NUMBER_OF_FACETS {
@@ -387,7 +408,10 @@ impl<'a> SearchForFacetValues<'a> {
                         result?;
                     let count = search_candidates.intersection_len(&bitmap);
                     if count != 0 {
-                        results.push(FacetValueHit { value: left_bound.to_string(), count });
+                        let value = self
+                            .one_original_value_of(fid, left_bound, bitmap.min().unwrap())?
+                            .unwrap_or_else(|| left_bound.to_string());
+                        results.push(FacetValueHit { value, count });
                         length += 1;
                     }
                     if length >= MAX_NUMBER_OF_FACETS {