mirror of
https://github.com/meilisearch/MeiliSearch
synced 2025-01-07 12:04:30 +01:00
7745cc9d3c
3921: Deactivate camel case segmentation r=dureuill a=ManyTheFish # Pull Request This PR deactivates the camel case segmentation to retrieve the possibility to accept typos over camel-cased words ## Related issue Fixes #3869 Fixes #3818 ## What does this PR do? - deactivates camelcase segmentation related to #3919 Co-authored-by: ManyTheFish <many@meilisearch.com>
338 lines
9.6 KiB
Rust
338 lines
9.6 KiB
Rust
use meili_snap::{json_string, snapshot};
|
|
use once_cell::sync::Lazy;
|
|
use serde_json::{json, Value};
|
|
|
|
use crate::common::index::Index;
|
|
use crate::common::Server;
|
|
|
|
async fn index_with_documents<'a>(server: &'a Server, documents: &Value) -> Index<'a> {
|
|
let index = server.index("test");
|
|
|
|
index.add_documents(documents.clone(), None).await;
|
|
index.wait_task(0).await;
|
|
index
|
|
}
|
|
|
|
static SIMPLE_SEARCH_DOCUMENTS: Lazy<Value> = Lazy::new(|| {
|
|
json!([
|
|
{
|
|
"title": "Shazam!",
|
|
"desc": "a Captain Marvel ersatz",
|
|
"id": "1",
|
|
},
|
|
{
|
|
"title": "Captain Planet",
|
|
"desc": "He's not part of the Marvel Cinematic Universe",
|
|
"id": "2",
|
|
},
|
|
{
|
|
"title": "Captain Marvel",
|
|
"desc": "a Shazam ersatz",
|
|
"id": "3",
|
|
}])
|
|
});
|
|
|
|
#[actix_rt::test]
|
|
async fn simple_search_on_title() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
// simple search should return 2 documents (ids: 2 and 3).
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["title"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"2");
|
|
},
|
|
)
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn search_no_searchable_attribute_set() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["unknown"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"0");
|
|
},
|
|
)
|
|
.await;
|
|
|
|
index.update_settings_searchable_attributes(json!(["*"])).await;
|
|
index.wait_task(1).await;
|
|
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["unknown"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"0");
|
|
},
|
|
)
|
|
.await;
|
|
|
|
index.update_settings_searchable_attributes(json!(["*"])).await;
|
|
index.wait_task(2).await;
|
|
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["unknown", "title"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"2");
|
|
},
|
|
)
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn search_on_all_attributes() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": ["*"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"3");
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn search_on_all_attributes_restricted_set() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
index.update_settings_searchable_attributes(json!(["title"])).await;
|
|
index.wait_task(1).await;
|
|
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": ["*"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"2");
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn simple_prefix_search_on_title() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
// simple search should return 2 documents (ids: 2 and 3).
|
|
index
|
|
.search(json!({"q": "Captain Mar", "attributesToSearchOn": ["title"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"2");
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn simple_search_on_title_matching_strategy_all() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
// simple search matching strategy all should only return 1 document (ids: 2).
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": ["title"], "matchingStrategy": "all"}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"1");
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn simple_search_on_no_field() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
// simple search on no field shouldn't return any document.
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": []}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"].as_array().unwrap().len(), @"0");
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn word_ranking_rule_order() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
// Document 3 should appear before document 2.
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["title"], "attributesToRetrieve": ["id"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(json_string!(response["hits"]),
|
|
@r###"
|
|
[
|
|
{
|
|
"id": "3"
|
|
},
|
|
{
|
|
"id": "2"
|
|
}
|
|
]
|
|
"###
|
|
);
|
|
},
|
|
)
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn word_ranking_rule_order_exact_words() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
index.update_settings_typo_tolerance(json!({"disableOnWords": ["Captain", "Marvel"]})).await;
|
|
index.wait_task(1).await;
|
|
|
|
// simple search should return 2 documents (ids: 2 and 3).
|
|
index
|
|
.search(
|
|
json!({"q": "Captain Marvel", "attributesToSearchOn": ["title"], "attributesToRetrieve": ["id"]}),
|
|
|response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(json_string!(response["hits"]),
|
|
@r###"
|
|
[
|
|
{
|
|
"id": "3"
|
|
},
|
|
{
|
|
"id": "2"
|
|
}
|
|
]
|
|
"###
|
|
);
|
|
},
|
|
)
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn typo_ranking_rule_order() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(
|
|
&server,
|
|
&json!([
|
|
{
|
|
"title": "Capitain Marivel",
|
|
"desc": "Captain Marvel",
|
|
"id": "1",
|
|
},
|
|
{
|
|
"title": "Captain Marivel",
|
|
"desc": "a Shazam ersatz",
|
|
"id": "2",
|
|
}]),
|
|
)
|
|
.await;
|
|
|
|
// Document 2 should appear before document 1.
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": ["title"], "attributesToRetrieve": ["id"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(json_string!(response["hits"]),
|
|
@r###"
|
|
[
|
|
{
|
|
"id": "2"
|
|
},
|
|
{
|
|
"id": "1"
|
|
}
|
|
]
|
|
"###
|
|
);
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn attributes_ranking_rule_order() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(
|
|
&server,
|
|
&json!([
|
|
{
|
|
"title": "Captain Marvel",
|
|
"desc": "a Shazam ersatz",
|
|
"footer": "The story of Captain Marvel",
|
|
"id": "1",
|
|
},
|
|
{
|
|
"title": "The Avengers",
|
|
"desc": "Captain Marvel is far from the earth",
|
|
"footer": "A super hero team",
|
|
"id": "2",
|
|
}]),
|
|
)
|
|
.await;
|
|
|
|
// Document 2 should appear before document 1.
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToSearchOn": ["desc", "footer"], "attributesToRetrieve": ["id"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(json_string!(response["hits"]),
|
|
@r###"
|
|
[
|
|
{
|
|
"id": "2"
|
|
},
|
|
{
|
|
"id": "1"
|
|
}
|
|
]
|
|
"###
|
|
);
|
|
})
|
|
.await;
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn exactness_ranking_rule_order() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(
|
|
&server,
|
|
&json!([
|
|
{
|
|
"title": "Captain Marvel",
|
|
"desc": "Captain Marivel",
|
|
"id": "1",
|
|
},
|
|
{
|
|
"title": "Captain Marvel",
|
|
"desc": "Captain the Marvel",
|
|
"id": "2",
|
|
}]),
|
|
)
|
|
.await;
|
|
|
|
// Document 2 should appear before document 1.
|
|
index
|
|
.search(json!({"q": "Captain Marvel", "attributesToRetrieve": ["id"], "attributesToSearchOn": ["desc"]}), |response, code| {
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(json_string!(response["hits"]),
|
|
@r###"
|
|
[
|
|
{
|
|
"id": "2"
|
|
},
|
|
{
|
|
"id": "1"
|
|
}
|
|
]
|
|
"###
|
|
);
|
|
})
|
|
.await;
|
|
}
|