mirror of
https://github.com/meilisearch/MeiliSearch
synced 2025-06-09 17:41:44 +02:00
335 lines
13 KiB
Rust
335 lines
13 KiB
Rust
use actix_web::web::{self, Data};
|
|
use actix_web::{HttpRequest, HttpResponse};
|
|
use deserr::actix_web::{AwebJson, AwebQueryParameter};
|
|
use index_scheduler::IndexScheduler;
|
|
use meilisearch_types::deserr::query_params::Param;
|
|
use meilisearch_types::deserr::{DeserrJsonError, DeserrQueryParamError};
|
|
use meilisearch_types::error::deserr_codes::*;
|
|
use meilisearch_types::error::ResponseError;
|
|
use meilisearch_types::index_uid::IndexUid;
|
|
use meilisearch_types::keys::actions;
|
|
use meilisearch_types::serde_cs::vec::CS;
|
|
use serde_json::Value;
|
|
use tracing::debug;
|
|
use utoipa::{IntoParams, OpenApi};
|
|
|
|
use super::ActionPolicy;
|
|
use crate::analytics::Analytics;
|
|
use crate::extractors::authentication::GuardedData;
|
|
use crate::extractors::sequential_extractor::SeqHandler;
|
|
use crate::routes::indexes::similar_analytics::{SimilarAggregator, SimilarGET, SimilarPOST};
|
|
use crate::search::{
|
|
add_search_rules, perform_similar, RankingScoreThresholdSimilar, RetrieveVectors, Route,
|
|
SearchKind, SimilarQuery, SimilarResult, DEFAULT_SEARCH_LIMIT, DEFAULT_SEARCH_OFFSET,
|
|
};
|
|
|
|
#[derive(OpenApi)]
|
|
#[openapi(
|
|
paths(similar_get, similar_post),
|
|
tags(
|
|
(
|
|
name = "Similar documents",
|
|
description = "The /similar route uses AI-powered search to return a number of documents similar to a target document.
|
|
|
|
Meilisearch exposes two routes for retrieving similar documents: POST and GET. In the majority of cases, POST will offer better performance and ease of use.",
|
|
external_docs(url = "https://www.meilisearch.com/docs/reference/api/similar"),
|
|
),
|
|
),
|
|
)]
|
|
pub struct SimilarApi;
|
|
|
|
pub fn configure(cfg: &mut web::ServiceConfig) {
|
|
cfg.service(
|
|
web::resource("")
|
|
.route(web::get().to(SeqHandler(similar_get)))
|
|
.route(web::post().to(SeqHandler(similar_post))),
|
|
);
|
|
}
|
|
|
|
/// Get similar documents with GET
|
|
///
|
|
/// Retrieve documents similar to a specific search result.
|
|
#[utoipa::path(
|
|
get,
|
|
path = "{indexUid}/similar",
|
|
tag = "Similar documents",
|
|
security(("Bearer" = ["search", "*"])),
|
|
params(
|
|
("indexUid" = String, Path, example = "movies", description = "Index Unique Identifier", nullable = false),
|
|
SimilarQueryGet
|
|
),
|
|
responses(
|
|
(status = 200, description = "The documents are returned", body = SimilarResult, content_type = "application/json", example = json!(
|
|
{
|
|
"hits": [
|
|
{
|
|
"id": 2770,
|
|
"title": "American Pie 2",
|
|
"poster": "https://image.tmdb.org/t/p/w1280/q4LNgUnRfltxzp3gf1MAGiK5LhV.jpg",
|
|
"overview": "The whole gang are back and as close as ever. They decide to get even closer by spending the summer together at a beach house. They decide to hold the biggest…",
|
|
"release_date": 997405200
|
|
},
|
|
{
|
|
"id": 190859,
|
|
"title": "American Sniper",
|
|
"poster": "https://image.tmdb.org/t/p/w1280/svPHnYE7N5NAGO49dBmRhq0vDQ3.jpg",
|
|
"overview": "U.S. Navy SEAL Chris Kyle takes his sole mission—protect his comrades—to heart and becomes one of the most lethal snipers in American history. His pinpoint accuracy not only saves countless lives but also makes him a prime…",
|
|
"release_date": 1418256000
|
|
}
|
|
],
|
|
"offset": 0,
|
|
"limit": 2,
|
|
"estimatedTotalHits": 976,
|
|
"processingTimeMs": 35,
|
|
"query": "american "
|
|
}
|
|
)),
|
|
(status = 404, description = "Index not found", body = ResponseError, content_type = "application/json", example = json!(
|
|
{
|
|
"message": "Index `movies` not found.",
|
|
"code": "index_not_found",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#index_not_found"
|
|
}
|
|
)),
|
|
(status = 401, description = "The authorization header is missing", body = ResponseError, content_type = "application/json", example = json!(
|
|
{
|
|
"message": "The Authorization header is missing. It must use the bearer authorization method.",
|
|
"code": "missing_authorization_header",
|
|
"type": "auth",
|
|
"link": "https://docs.meilisearch.com/errors#missing_authorization_header"
|
|
}
|
|
)),
|
|
)
|
|
)]
|
|
pub async fn similar_get(
|
|
index_scheduler: GuardedData<ActionPolicy<{ actions::SEARCH }>, Data<IndexScheduler>>,
|
|
index_uid: web::Path<String>,
|
|
params: AwebQueryParameter<SimilarQueryGet, DeserrQueryParamError>,
|
|
req: HttpRequest,
|
|
analytics: web::Data<Analytics>,
|
|
) -> Result<HttpResponse, ResponseError> {
|
|
let index_uid = IndexUid::try_from(index_uid.into_inner())?;
|
|
|
|
let query = params.0.into();
|
|
|
|
let mut aggregate = SimilarAggregator::<SimilarGET>::from_query(&query);
|
|
|
|
debug!(parameters = ?query, "Similar get");
|
|
|
|
let similar = similar(index_scheduler, index_uid, query).await;
|
|
|
|
if let Ok(similar) = &similar {
|
|
aggregate.succeed(similar);
|
|
}
|
|
analytics.publish(aggregate, &req);
|
|
|
|
let similar = similar?;
|
|
|
|
debug!(returns = ?similar, "Similar get");
|
|
Ok(HttpResponse::Ok().json(similar))
|
|
}
|
|
|
|
/// Get similar documents with POST
|
|
///
|
|
/// Retrieve documents similar to a specific search result.
|
|
#[utoipa::path(
|
|
post,
|
|
path = "{indexUid}/similar",
|
|
tag = "Similar documents",
|
|
security(("Bearer" = ["search", "*"])),
|
|
params(("indexUid" = String, Path, example = "movies", description = "Index Unique Identifier", nullable = false)),
|
|
request_body = SimilarQuery,
|
|
responses(
|
|
(status = 200, description = "The documents are returned", body = SimilarResult, content_type = "application/json", example = json!(
|
|
{
|
|
"hits": [
|
|
{
|
|
"id": 2770,
|
|
"title": "American Pie 2",
|
|
"poster": "https://image.tmdb.org/t/p/w1280/q4LNgUnRfltxzp3gf1MAGiK5LhV.jpg",
|
|
"overview": "The whole gang are back and as close as ever. They decide to get even closer by spending the summer together at a beach house. They decide to hold the biggest…",
|
|
"release_date": 997405200
|
|
},
|
|
{
|
|
"id": 190859,
|
|
"title": "American Sniper",
|
|
"poster": "https://image.tmdb.org/t/p/w1280/svPHnYE7N5NAGO49dBmRhq0vDQ3.jpg",
|
|
"overview": "U.S. Navy SEAL Chris Kyle takes his sole mission—protect his comrades—to heart and becomes one of the most lethal snipers in American history. His pinpoint accuracy not only saves countless lives but also makes him a prime…",
|
|
"release_date": 1418256000
|
|
}
|
|
],
|
|
"offset": 0,
|
|
"limit": 2,
|
|
"estimatedTotalHits": 976,
|
|
"processingTimeMs": 35,
|
|
"query": "american "
|
|
}
|
|
)),
|
|
(status = 404, description = "Index not found", body = ResponseError, content_type = "application/json", example = json!(
|
|
{
|
|
"message": "Index `movies` not found.",
|
|
"code": "index_not_found",
|
|
"type": "invalid_request",
|
|
"link": "https://docs.meilisearch.com/errors#index_not_found"
|
|
}
|
|
)),
|
|
(status = 401, description = "The authorization header is missing", body = ResponseError, content_type = "application/json", example = json!(
|
|
{
|
|
"message": "The Authorization header is missing. It must use the bearer authorization method.",
|
|
"code": "missing_authorization_header",
|
|
"type": "auth",
|
|
"link": "https://docs.meilisearch.com/errors#missing_authorization_header"
|
|
}
|
|
)),
|
|
)
|
|
)]
|
|
pub async fn similar_post(
|
|
index_scheduler: GuardedData<ActionPolicy<{ actions::SEARCH }>, Data<IndexScheduler>>,
|
|
index_uid: web::Path<String>,
|
|
params: AwebJson<SimilarQuery, DeserrJsonError>,
|
|
req: HttpRequest,
|
|
analytics: web::Data<Analytics>,
|
|
) -> Result<HttpResponse, ResponseError> {
|
|
let index_uid = IndexUid::try_from(index_uid.into_inner())?;
|
|
|
|
let query = params.into_inner();
|
|
debug!(parameters = ?query, "Similar post");
|
|
|
|
let mut aggregate = SimilarAggregator::<SimilarPOST>::from_query(&query);
|
|
|
|
let similar = similar(index_scheduler, index_uid, query).await;
|
|
|
|
if let Ok(similar) = &similar {
|
|
aggregate.succeed(similar);
|
|
}
|
|
analytics.publish(aggregate, &req);
|
|
|
|
let similar = similar?;
|
|
|
|
debug!(returns = ?similar, "Similar post");
|
|
Ok(HttpResponse::Ok().json(similar))
|
|
}
|
|
|
|
async fn similar(
|
|
index_scheduler: GuardedData<ActionPolicy<{ actions::SEARCH }>, Data<IndexScheduler>>,
|
|
index_uid: IndexUid,
|
|
mut query: SimilarQuery,
|
|
) -> Result<SimilarResult, ResponseError> {
|
|
let retrieve_vectors = RetrieveVectors::new(query.retrieve_vectors);
|
|
|
|
// Tenant token search_rules.
|
|
if let Some(search_rules) = index_scheduler.filters().get_index_search_rules(&index_uid) {
|
|
add_search_rules(&mut query.filter, search_rules);
|
|
}
|
|
|
|
let index = index_scheduler.index(&index_uid)?;
|
|
|
|
let (embedder_name, embedder, quantized) = SearchKind::embedder(
|
|
&index_scheduler,
|
|
index_uid.to_string(),
|
|
&index,
|
|
&query.embedder,
|
|
None,
|
|
Route::Similar,
|
|
)?;
|
|
|
|
tokio::task::spawn_blocking(move || {
|
|
perform_similar(
|
|
&index,
|
|
query,
|
|
embedder_name,
|
|
embedder,
|
|
quantized,
|
|
retrieve_vectors,
|
|
index_scheduler.features(),
|
|
)
|
|
})
|
|
.await?
|
|
}
|
|
|
|
#[derive(Debug, deserr::Deserr, IntoParams)]
|
|
#[deserr(error = DeserrQueryParamError, rename_all = camelCase, deny_unknown_fields)]
|
|
#[into_params(parameter_in = Query)]
|
|
pub struct SimilarQueryGet {
|
|
#[deserr(error = DeserrQueryParamError<InvalidSimilarId>)]
|
|
#[param(value_type = String)]
|
|
id: Param<String>,
|
|
#[deserr(default = Param(DEFAULT_SEARCH_OFFSET()), error = DeserrQueryParamError<InvalidSimilarOffset>)]
|
|
#[param(value_type = usize, default = DEFAULT_SEARCH_OFFSET)]
|
|
offset: Param<usize>,
|
|
#[deserr(default = Param(DEFAULT_SEARCH_LIMIT()), error = DeserrQueryParamError<InvalidSimilarLimit>)]
|
|
#[param(value_type = usize, default = DEFAULT_SEARCH_LIMIT)]
|
|
limit: Param<usize>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarAttributesToRetrieve>)]
|
|
#[param(value_type = Vec<String>)]
|
|
attributes_to_retrieve: Option<CS<String>>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarRetrieveVectors>)]
|
|
#[param(value_type = bool, default)]
|
|
retrieve_vectors: Param<bool>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarFilter>)]
|
|
filter: Option<String>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarShowRankingScore>)]
|
|
#[param(value_type = bool, default)]
|
|
show_ranking_score: Param<bool>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarShowRankingScoreDetails>)]
|
|
#[param(value_type = bool, default)]
|
|
show_ranking_score_details: Param<bool>,
|
|
#[deserr(default, error = DeserrQueryParamError<InvalidSimilarRankingScoreThreshold>, default)]
|
|
#[param(value_type = Option<f32>)]
|
|
pub ranking_score_threshold: Option<RankingScoreThresholdGet>,
|
|
#[deserr(error = DeserrQueryParamError<InvalidSimilarEmbedder>)]
|
|
pub embedder: String,
|
|
}
|
|
|
|
#[derive(Debug, Clone, Copy, PartialEq, deserr::Deserr)]
|
|
#[deserr(try_from(String) = TryFrom::try_from -> InvalidSimilarRankingScoreThreshold)]
|
|
pub struct RankingScoreThresholdGet(RankingScoreThresholdSimilar);
|
|
|
|
impl std::convert::TryFrom<String> for RankingScoreThresholdGet {
|
|
type Error = InvalidSimilarRankingScoreThreshold;
|
|
|
|
fn try_from(s: String) -> Result<Self, Self::Error> {
|
|
let f: f64 = s.parse().map_err(|_| InvalidSimilarRankingScoreThreshold)?;
|
|
Ok(RankingScoreThresholdGet(RankingScoreThresholdSimilar::try_from(f)?))
|
|
}
|
|
}
|
|
|
|
impl From<SimilarQueryGet> for SimilarQuery {
|
|
fn from(
|
|
SimilarQueryGet {
|
|
id,
|
|
offset,
|
|
limit,
|
|
attributes_to_retrieve,
|
|
retrieve_vectors,
|
|
filter,
|
|
show_ranking_score,
|
|
show_ranking_score_details,
|
|
embedder,
|
|
ranking_score_threshold,
|
|
}: SimilarQueryGet,
|
|
) -> Self {
|
|
let filter = match filter {
|
|
Some(f) => match serde_json::from_str(&f) {
|
|
Ok(v) => Some(v),
|
|
_ => Some(Value::String(f)),
|
|
},
|
|
None => None,
|
|
};
|
|
|
|
SimilarQuery {
|
|
id: serde_json::Value::String(id.0),
|
|
offset: offset.0,
|
|
limit: limit.0,
|
|
filter,
|
|
embedder,
|
|
attributes_to_retrieve: attributes_to_retrieve.map(|o| o.into_iter().collect()),
|
|
retrieve_vectors: retrieve_vectors.0,
|
|
show_ranking_score: show_ranking_score.0,
|
|
show_ranking_score_details: show_ranking_score_details.0,
|
|
ranking_score_threshold: ranking_score_threshold.map(|x| x.0),
|
|
}
|
|
}
|
|
}
|