mirror of
https://github.com/meilisearch/MeiliSearch
synced 2024-11-10 15:08:56 +01:00
254 lines
12 KiB
Rust
254 lines
12 KiB
Rust
use meili_snap::snapshot;
|
|
use once_cell::sync::Lazy;
|
|
|
|
use crate::common::index::Index;
|
|
use crate::common::{Server, Value};
|
|
use crate::json;
|
|
|
|
async fn index_with_documents<'a>(server: &'a Server, documents: &Value) -> Index<'a> {
|
|
let index = server.index("test");
|
|
|
|
let (response, code) = server.set_features(json!({"vectorStore": true})).await;
|
|
|
|
meili_snap::snapshot!(code, @"200 OK");
|
|
meili_snap::snapshot!(meili_snap::json_string!(response), @r###"
|
|
{
|
|
"vectorStore": true,
|
|
"metrics": false,
|
|
"logsRoute": false,
|
|
"exportPuffinReports": false
|
|
}
|
|
"###);
|
|
|
|
let (response, code) = index
|
|
.update_settings(json!({ "embedders": {"default": {
|
|
"source": "userProvided",
|
|
"dimensions": 2}}} ))
|
|
.await;
|
|
assert_eq!(202, code, "{:?}", response);
|
|
index.wait_task(response.uid()).await;
|
|
|
|
let (response, code) = index.add_documents(documents.clone(), None).await;
|
|
assert_eq!(202, code, "{:?}", response);
|
|
index.wait_task(response.uid()).await;
|
|
index
|
|
}
|
|
|
|
static SIMPLE_SEARCH_DOCUMENTS: Lazy<Value> = Lazy::new(|| {
|
|
json!([
|
|
{
|
|
"title": "Shazam!",
|
|
"desc": "a Captain Marvel ersatz",
|
|
"id": "1",
|
|
"_vectors": {"default": [1.0, 3.0]},
|
|
},
|
|
{
|
|
"title": "Captain Planet",
|
|
"desc": "He's not part of the Marvel Cinematic Universe",
|
|
"id": "2",
|
|
"_vectors": {"default": [1.0, 2.0]},
|
|
},
|
|
{
|
|
"title": "Captain Marvel",
|
|
"desc": "a Shazam ersatz",
|
|
"id": "3",
|
|
"_vectors": {"default": [2.0, 3.0]},
|
|
}])
|
|
});
|
|
|
|
static SINGLE_DOCUMENT: Lazy<Value> = Lazy::new(|| {
|
|
json!([{
|
|
"title": "Shazam!",
|
|
"desc": "a Captain Marvel ersatz",
|
|
"id": "1",
|
|
"_vectors": {"default": [1.0, 3.0]},
|
|
}])
|
|
});
|
|
|
|
#[actix_rt::test]
|
|
async fn simple_search() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
let (response, code) = index
|
|
.search_post(
|
|
json!({"q": "Captain", "vector": [1.0, 1.0], "hybrid": {"semanticRatio": 0.2}}),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]}},{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]}},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]}}]"###);
|
|
|
|
let (response, code) = index
|
|
.search_post(
|
|
json!({"q": "Captain", "vector": [1.0, 1.0], "hybrid": {"semanticRatio": 0.8}}),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_semanticScore":0.99029034},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_semanticScore":0.97434163},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_semanticScore":0.9472136}]"###);
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn distribution_shift() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
let search = json!({"q": "Captain", "vector": [1.0, 1.0], "showRankingScore": true, "hybrid": {"semanticRatio": 1.0}});
|
|
let (response, code) = index.search_post(search.clone()).await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_rankingScore":0.990290343761444,"_semanticScore":0.99029034},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_rankingScore":0.974341630935669,"_semanticScore":0.97434163},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_rankingScore":0.9472135901451112,"_semanticScore":0.9472136}]"###);
|
|
|
|
let (response, code) = index
|
|
.update_settings(json!({
|
|
"embedders": {
|
|
"default": {
|
|
"distribution": {
|
|
"mean": 0.998,
|
|
"sigma": 0.01
|
|
}
|
|
}
|
|
}
|
|
}))
|
|
.await;
|
|
|
|
snapshot!(code, @"202 Accepted");
|
|
let response = server.wait_task(response.uid()).await;
|
|
snapshot!(response["details"], @r###"{"embedders":{"default":{"distribution":{"mean":0.998,"sigma":0.01}}}}"###);
|
|
|
|
let (response, code) = index.search_post(search).await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_rankingScore":0.19161224365234375,"_semanticScore":0.19161224},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_rankingScore":1.1920928955078125e-7,"_semanticScore":1.1920929e-7},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_rankingScore":1.1920928955078125e-7,"_semanticScore":1.1920929e-7}]"###);
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn highlighter() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
let (response, code) = index
|
|
.search_post(json!({"q": "Captain Marvel", "vector": [1.0, 1.0],
|
|
"hybrid": {"semanticRatio": 0.2},
|
|
"attributesToHighlight": [
|
|
"desc"
|
|
],
|
|
"highlightPreTag": "**BEGIN**",
|
|
"highlightPostTag": "**END**"
|
|
}))
|
|
.await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_formatted":{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":["2.0","3.0"]}}},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_formatted":{"title":"Shazam!","desc":"a **BEGIN**Captain**END** **BEGIN**Marvel**END** ersatz","id":"1","_vectors":{"default":["1.0","3.0"]}}},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_formatted":{"title":"Captain Planet","desc":"He's not part of the **BEGIN**Marvel**END** Cinematic Universe","id":"2","_vectors":{"default":["1.0","2.0"]}}}]"###);
|
|
|
|
let (response, code) = index
|
|
.search_post(json!({"q": "Captain Marvel", "vector": [1.0, 1.0],
|
|
"hybrid": {"semanticRatio": 0.8},
|
|
"attributesToHighlight": [
|
|
"desc"
|
|
],
|
|
"highlightPreTag": "**BEGIN**",
|
|
"highlightPostTag": "**END**"
|
|
}))
|
|
.await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_formatted":{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":["2.0","3.0"]}},"_semanticScore":0.99029034},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_formatted":{"title":"Captain Planet","desc":"He's not part of the **BEGIN**Marvel**END** Cinematic Universe","id":"2","_vectors":{"default":["1.0","2.0"]}},"_semanticScore":0.97434163},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_formatted":{"title":"Shazam!","desc":"a **BEGIN**Captain**END** **BEGIN**Marvel**END** ersatz","id":"1","_vectors":{"default":["1.0","3.0"]}},"_semanticScore":0.9472136}]"###);
|
|
|
|
// no highlighting on full semantic
|
|
let (response, code) = index
|
|
.search_post(json!({"q": "Captain Marvel", "vector": [1.0, 1.0],
|
|
"hybrid": {"semanticRatio": 1.0},
|
|
"attributesToHighlight": [
|
|
"desc"
|
|
],
|
|
"highlightPreTag": "**BEGIN**",
|
|
"highlightPostTag": "**END**"
|
|
}))
|
|
.await;
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":[2.0,3.0]},"_formatted":{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3","_vectors":{"default":["2.0","3.0"]}},"_semanticScore":0.99029034},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":[1.0,2.0]},"_formatted":{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2","_vectors":{"default":["1.0","2.0"]}},"_semanticScore":0.97434163},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_formatted":{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":["1.0","3.0"]}}}]"###);
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn invalid_semantic_ratio() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await;
|
|
|
|
let (response, code) = index
|
|
.search_post(
|
|
json!({"q": "Captain", "vector": [1.0, 1.0], "hybrid": {"semanticRatio": 1.2}}),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"400 Bad Request");
|
|
snapshot!(response, @r###"
|
|
{
|
|
"message": "Invalid value at `.hybrid.semanticRatio`: the value of `semanticRatio` is invalid, expected a float between `0.0` and `1.0`.",
|
|
"code": "invalid_search_semantic_ratio",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#invalid_search_semantic_ratio"
|
|
}
|
|
"###);
|
|
|
|
let (response, code) = index
|
|
.search_post(
|
|
json!({"q": "Captain", "vector": [1.0, 1.0], "hybrid": {"semanticRatio": -0.8}}),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"400 Bad Request");
|
|
snapshot!(response, @r###"
|
|
{
|
|
"message": "Invalid value at `.hybrid.semanticRatio`: the value of `semanticRatio` is invalid, expected a float between `0.0` and `1.0`.",
|
|
"code": "invalid_search_semantic_ratio",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#invalid_search_semantic_ratio"
|
|
}
|
|
"###);
|
|
|
|
let (response, code) = index
|
|
.search_get(
|
|
&yaup::to_string(
|
|
&json!({"q": "Captain", "vector": [1.0, 1.0], "hybridSemanticRatio": 1.2}),
|
|
)
|
|
.unwrap(),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"400 Bad Request");
|
|
snapshot!(response, @r###"
|
|
{
|
|
"message": "Invalid value in parameter `hybridSemanticRatio`: the value of `semanticRatio` is invalid, expected a float between `0.0` and `1.0`.",
|
|
"code": "invalid_search_semantic_ratio",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#invalid_search_semantic_ratio"
|
|
}
|
|
"###);
|
|
|
|
let (response, code) = index
|
|
.search_get(
|
|
&yaup::to_string(
|
|
&json!({"q": "Captain", "vector": [1.0, 1.0], "hybridSemanticRatio": -0.2}),
|
|
)
|
|
.unwrap(),
|
|
)
|
|
.await;
|
|
snapshot!(code, @"400 Bad Request");
|
|
snapshot!(response, @r###"
|
|
{
|
|
"message": "Invalid value in parameter `hybridSemanticRatio`: the value of `semanticRatio` is invalid, expected a float between `0.0` and `1.0`.",
|
|
"code": "invalid_search_semantic_ratio",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#invalid_search_semantic_ratio"
|
|
}
|
|
"###);
|
|
}
|
|
|
|
#[actix_rt::test]
|
|
async fn single_document() {
|
|
let server = Server::new().await;
|
|
let index = index_with_documents(&server, &SINGLE_DOCUMENT).await;
|
|
|
|
let (response, code) = index
|
|
.search_post(
|
|
json!({"vector": [1.0, 3.0], "hybrid": {"semanticRatio": 1.0}, "showRankingScore": true}),
|
|
)
|
|
.await;
|
|
|
|
snapshot!(code, @"200 OK");
|
|
snapshot!(response["hits"][0], @r###"{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1","_vectors":{"default":[1.0,3.0]},"_rankingScore":1.0,"_semanticScore":1.0}"###);
|
|
}
|