From 8ac5b765bc0d22dd8448e671c66529ca668e3389 Mon Sep 17 00:00:00 2001 From: Kerollmops Date: Mon, 4 Sep 2023 14:39:52 +0200 Subject: [PATCH] Fix synonyms normalization --- milli/src/update/settings.rs | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/milli/src/update/settings.rs b/milli/src/update/settings.rs index 023e09aa0..b0452315d 100644 --- a/milli/src/update/settings.rs +++ b/milli/src/update/settings.rs @@ -573,7 +573,7 @@ impl<'a, 't, 'u, 'i> Settings<'a, 't, 'u, 'i> { tokenizer .tokenize(text) .filter_map(|token| { - if token.is_word() { + if token.is_word() && !token.lemma().is_empty() { Some(token.lemma().to_string()) } else { None @@ -1443,7 +1443,7 @@ mod tests { index .update_settings_using_wtxn(&mut wtxn, |settings| { settings.set_synonyms(btreemap! { - "japanese".to_string() => vec!["ญี่ปุ่น", "ยี่ปุ่น"], + "japanese".to_string() => vec![S("ญี่ปุ่น"), S("ยี่ปุ่น")], }); }) .unwrap();