MeiliSearch/milli/tests/search/distinct.rs

74 lines
2.9 KiB
Rust
Raw Normal View History

2021-06-17 14:24:59 +02:00
use std::collections::HashSet;
use big_s::S;
use milli::update::Settings;
use milli::{Criterion, Search, SearchResult};
use Criterion::*;
use crate::search::{self, EXTERNAL_DOCUMENTS_IDS};
// Generates a `#[test]` function named `$func` that checks that search results are
// deduplicated on a document field.
//
// Parameters:
// - `$func`: name of the generated test function.
// - `$distinct`: identifier of the distinct field. It is stringified to configure the
//   index settings and is also used as a field access on each expected document.
// - `$criteria`: expression producing the criteria handed to
//   `search::setup_search_index_with_criteria` and `search::expected_order`.
//
// The generated test panics (and therefore fails) on any error from the index,
// the settings update, or the search, as well as on a result mismatch.
macro_rules! test_distinct {
    ($func:ident, $distinct:ident, $criteria:expr) => {
        #[test]
        fn $func() {
            let criteria = $criteria;
            let index = search::setup_search_index_with_criteria(&criteria);

            // Update the distinct attribute inside its own write transaction and
            // commit it before any read transaction is opened.
            let mut wtxn = index.write_txn().unwrap();
            let config = milli::update::IndexerConfig::default();
            let mut builder = Settings::new(&mut wtxn, &index, &config);
            builder.set_distinct_field(S(stringify!($distinct)));
            builder.execute(|_| ()).unwrap();
            wtxn.commit().unwrap();

            let rtxn = index.read_txn().unwrap();

            // The limit equals the number of known external ids, so the limit
            // itself should not truncate the result set.
            let mut search = Search::new(&rtxn, &index);
            search.query(search::TEST_QUERY);
            search.limit(EXTERNAL_DOCUMENTS_IDS.len());
            search.authorize_typos(true);
            search.optional_words(true);

            let SearchResult { documents_ids, .. } = search.execute().unwrap();

            // Build the expectation: walk the expected ordering and keep only the
            // first document seen for each distinct value. `HashSet::insert`
            // returns `true` only when the value was not already present.
            // NOTE(review): the two `true` arguments presumably mirror the typo and
            // optional-words settings above -- confirm against `expected_order`.
            let mut distinct_values = HashSet::new();
            let expected_external_ids: Vec<_> =
                search::expected_order(&criteria, true, true, &[])
                    .into_iter()
                    .filter_map(|d| {
                        distinct_values.insert(d.$distinct.to_owned()).then(|| d.id)
                    })
                    .collect();

            let documents_ids = search::internal_to_external_ids(&index, &documents_ids);
            assert_eq!(documents_ids, expected_external_ids);
        }
    };
}
2021-06-17 15:19:03 +02:00
test_distinct!(
distinct_string_default_criteria,
tag,
vec![Words, Typo, Proximity, Attribute, Exactness]
);
test_distinct!(
distinct_number_default_criteria,
asc_desc_rank,
vec![Words, Typo, Proximity, Attribute, Exactness]
);
test_distinct!(distinct_string_criterion_words, tag, vec![Words]);
test_distinct!(distinct_number_criterion_words, asc_desc_rank, vec![Words]);
test_distinct!(distinct_string_criterion_words_typo, tag, vec![Words, Typo]);
test_distinct!(distinct_number_criterion_words_typo, asc_desc_rank, vec![Words, Typo]);
test_distinct!(distinct_string_criterion_words_proximity, tag, vec![Words, Proximity]);
2021-06-17 14:24:59 +02:00
test_distinct!(distinct_number_criterion_words_proximity, asc_desc_rank, vec![Words, Proximity]);
2021-06-17 15:19:03 +02:00
test_distinct!(distinct_string_criterion_words_attribute, tag, vec![Words, Attribute]);
2021-06-17 14:24:59 +02:00
test_distinct!(distinct_number_criterion_words_attribute, asc_desc_rank, vec![Words, Attribute]);
2021-06-17 15:19:03 +02:00
test_distinct!(distinct_string_criterion_words_exactness, tag, vec![Words, Exactness]);
2021-06-17 14:24:59 +02:00
test_distinct!(distinct_number_criterion_words_exactness, asc_desc_rank, vec![Words, Exactness]);