// Source file: MeiliSearch/meilisearch-core/src/serde/indexer.rs

2020-01-29 18:30:21 +01:00
use meilisearch_schema::IndexedPos;
2019-10-03 11:49:13 +02:00
use serde::ser;
use serde::Serialize;
2019-10-18 13:05:28 +02:00
use super::{ConvertToString, SerializerError};
2019-10-03 11:49:13 +02:00
use crate::raw_indexer::RawIndexer;
2019-10-18 13:05:28 +02:00
use crate::DocumentId;
2019-10-03 11:49:13 +02:00
pub struct Indexer<'a> {
2020-01-10 18:20:30 +01:00
pub pos: IndexedPos,
2019-10-03 11:49:13 +02:00
pub indexer: &'a mut RawIndexer,
pub document_id: DocumentId,
}
impl<'a> ser::Serializer for Indexer<'a> {
type Ok = Option<usize>;
2019-10-03 11:49:13 +02:00
type Error = SerializerError;
type SerializeSeq = SeqIndexer<'a>;
type SerializeTuple = TupleIndexer<'a>;
type SerializeTupleStruct = ser::Impossible<Self::Ok, Self::Error>;
type SerializeTupleVariant = ser::Impossible<Self::Ok, Self::Error>;
type SerializeMap = MapIndexer<'a>;
type SerializeStruct = StructIndexer<'a>;
2019-10-03 11:49:13 +02:00
type SerializeStructVariant = ser::Impossible<Self::Ok, Self::Error>;
fn serialize_bool(self, _value: bool) -> Result<Self::Ok, Self::Error> {
Ok(None)
2019-10-03 11:49:13 +02:00
}
fn serialize_char(self, value: char) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_i8(self, value: i8) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_i16(self, value: i16) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_i32(self, value: i32) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_i64(self, value: i64) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_u8(self, value: u8) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_u16(self, value: u16) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_u32(self, value: u32) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_u64(self, value: u64) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_f32(self, value: f32) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_f64(self, value: f64) -> Result<Self::Ok, Self::Error> {
let text = value.serialize(ConvertToString)?;
self.serialize_str(&text)
}
fn serialize_str(self, text: &str) -> Result<Self::Ok, Self::Error> {
2019-10-18 13:05:28 +02:00
let number_of_words = self
.indexer
2020-01-10 18:20:30 +01:00
.index_text(self.document_id, self.pos, text);
Ok(Some(number_of_words))
2019-10-03 11:49:13 +02:00
}
fn serialize_bytes(self, _v: &[u8]) -> Result<Self::Ok, Self::Error> {
Err(SerializerError::UnindexableType { type_name: "&[u8]" })
}
fn serialize_none(self) -> Result<Self::Ok, Self::Error> {
Ok(None)
2019-10-03 11:49:13 +02:00
}
fn serialize_some<T: ?Sized>(self, value: &T) -> Result<Self::Ok, Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
let text = value.serialize(ConvertToString)?;
2019-10-18 13:05:28 +02:00
let number_of_words = self
.indexer
2020-01-10 18:20:30 +01:00
.index_text(self.document_id, self.pos, &text);
Ok(Some(number_of_words))
2019-10-03 11:49:13 +02:00
}
fn serialize_unit(self) -> Result<Self::Ok, Self::Error> {
Ok(None)
2019-10-03 11:49:13 +02:00
}
fn serialize_unit_struct(self, _name: &'static str) -> Result<Self::Ok, Self::Error> {
Ok(None)
2019-10-03 11:49:13 +02:00
}
fn serialize_unit_variant(
self,
_name: &'static str,
_variant_index: u32,
2019-10-18 13:05:28 +02:00
_variant: &'static str,
) -> Result<Self::Ok, Self::Error> {
Ok(None)
2019-10-03 11:49:13 +02:00
}
fn serialize_newtype_struct<T: ?Sized>(
self,
_name: &'static str,
2019-10-18 13:05:28 +02:00
value: &T,
2019-10-03 11:49:13 +02:00
) -> Result<Self::Ok, Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
value.serialize(self)
}
fn serialize_newtype_variant<T: ?Sized>(
self,
_name: &'static str,
_variant_index: u32,
_variant: &'static str,
2019-10-18 13:05:28 +02:00
_value: &T,
2019-10-03 11:49:13 +02:00
) -> Result<Self::Ok, Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
2019-10-18 13:05:28 +02:00
Err(SerializerError::UnindexableType {
type_name: "newtype variant",
})
2019-10-03 11:49:13 +02:00
}
fn serialize_seq(self, _len: Option<usize>) -> Result<Self::SerializeSeq, Self::Error> {
let indexer = SeqIndexer {
2020-01-10 18:20:30 +01:00
pos: self.pos,
2019-10-03 11:49:13 +02:00
document_id: self.document_id,
indexer: self.indexer,
texts: Vec::new(),
};
Ok(indexer)
}
fn serialize_tuple(self, _len: usize) -> Result<Self::SerializeTuple, Self::Error> {
let indexer = TupleIndexer {
2020-01-10 18:20:30 +01:00
pos: self.pos,
2019-10-03 11:49:13 +02:00
document_id: self.document_id,
indexer: self.indexer,
texts: Vec::new(),
};
Ok(indexer)
}
fn serialize_tuple_struct(
self,
_name: &'static str,
2019-10-18 13:05:28 +02:00
_len: usize,
) -> Result<Self::SerializeTupleStruct, Self::Error> {
Err(SerializerError::UnindexableType {
type_name: "tuple struct",
})
2019-10-03 11:49:13 +02:00
}
fn serialize_tuple_variant(
self,
_name: &'static str,
_variant_index: u32,
_variant: &'static str,
2019-10-18 13:05:28 +02:00
_len: usize,
) -> Result<Self::SerializeTupleVariant, Self::Error> {
Err(SerializerError::UnindexableType {
type_name: "tuple variant",
})
2019-10-03 11:49:13 +02:00
}
fn serialize_map(self, _len: Option<usize>) -> Result<Self::SerializeMap, Self::Error> {
let indexer = MapIndexer {
2020-01-10 18:20:30 +01:00
pos: self.pos,
2019-10-03 11:49:13 +02:00
document_id: self.document_id,
indexer: self.indexer,
texts: Vec::new(),
};
Ok(indexer)
}
fn serialize_struct(
self,
_name: &'static str,
2019-10-18 13:05:28 +02:00
_len: usize,
) -> Result<Self::SerializeStruct, Self::Error> {
let indexer = StructIndexer {
2020-01-10 18:20:30 +01:00
pos: self.pos,
document_id: self.document_id,
indexer: self.indexer,
texts: Vec::new(),
};
Ok(indexer)
2019-10-03 11:49:13 +02:00
}
fn serialize_struct_variant(
self,
_name: &'static str,
_variant_index: u32,
_variant: &'static str,
2019-10-18 13:05:28 +02:00
_len: usize,
) -> Result<Self::SerializeStructVariant, Self::Error> {
Err(SerializerError::UnindexableType {
type_name: "struct variant",
})
2019-10-03 11:49:13 +02:00
}
}
pub struct SeqIndexer<'a> {
2020-01-10 18:20:30 +01:00
pos: IndexedPos,
2019-10-03 11:49:13 +02:00
document_id: DocumentId,
indexer: &'a mut RawIndexer,
texts: Vec<String>,
}
impl<'a> ser::SerializeSeq for SeqIndexer<'a> {
type Ok = Option<usize>;
2019-10-03 11:49:13 +02:00
type Error = SerializerError;
fn serialize_element<T: ?Sized>(&mut self, value: &T) -> Result<(), Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
let text = value.serialize(ConvertToString)?;
self.texts.push(text);
Ok(())
}
fn end(self) -> Result<Self::Ok, Self::Error> {
let texts = self.texts.iter().map(String::as_str);
2019-10-18 13:05:28 +02:00
self.indexer
2020-01-10 18:20:30 +01:00
.index_text_seq(self.document_id, self.pos, texts);
Ok(None)
2019-10-03 11:49:13 +02:00
}
}
pub struct MapIndexer<'a> {
2020-01-10 18:20:30 +01:00
pos: IndexedPos,
2019-10-03 11:49:13 +02:00
document_id: DocumentId,
indexer: &'a mut RawIndexer,
texts: Vec<String>,
}
impl<'a> ser::SerializeMap for MapIndexer<'a> {
type Ok = Option<usize>;
2019-10-03 11:49:13 +02:00
type Error = SerializerError;
fn serialize_key<T: ?Sized>(&mut self, key: &T) -> Result<(), Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
let text = key.serialize(ConvertToString)?;
self.texts.push(text);
Ok(())
}
fn serialize_value<T: ?Sized>(&mut self, value: &T) -> Result<(), Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
let text = value.serialize(ConvertToString)?;
self.texts.push(text);
Ok(())
}
fn end(self) -> Result<Self::Ok, Self::Error> {
let texts = self.texts.iter().map(String::as_str);
2019-10-18 13:05:28 +02:00
self.indexer
2020-01-10 18:20:30 +01:00
.index_text_seq(self.document_id, self.pos, texts);
Ok(None)
2019-10-03 11:49:13 +02:00
}
}
pub struct StructIndexer<'a> {
2020-01-10 18:20:30 +01:00
pos: IndexedPos,
2019-10-03 11:49:13 +02:00
document_id: DocumentId,
indexer: &'a mut RawIndexer,
texts: Vec<String>,
}
impl<'a> ser::SerializeStruct for StructIndexer<'a> {
type Ok = Option<usize>;
2019-10-03 11:49:13 +02:00
type Error = SerializerError;
fn serialize_field<T: ?Sized>(
&mut self,
key: &'static str,
value: &T,
) -> Result<(), Self::Error>
2019-10-18 13:05:28 +02:00
where
T: ser::Serialize,
2019-10-03 11:49:13 +02:00
{
let key_text = key.to_owned();
let value_text = value.serialize(ConvertToString)?;
self.texts.push(key_text);
self.texts.push(value_text);
Ok(())
}
fn end(self) -> Result<Self::Ok, Self::Error> {
let texts = self.texts.iter().map(String::as_str);
2019-10-18 13:05:28 +02:00
self.indexer
2020-01-10 18:20:30 +01:00
.index_text_seq(self.document_id, self.pos, texts);
Ok(None)
2019-10-03 11:49:13 +02:00
}
}
pub struct TupleIndexer<'a> {
2020-01-10 18:20:30 +01:00
pos: IndexedPos,
2019-10-03 11:49:13 +02:00
document_id: DocumentId,
indexer: &'a mut RawIndexer,
texts: Vec<String>,
}
impl<'a> ser::SerializeTuple for TupleIndexer<'a> {
type Ok = Option<usize>;
2019-10-03 11:49:13 +02:00
type Error = SerializerError;
fn serialize_element<T: ?Sized>(&mut self, value: &T) -> Result<(), Self::Error>
2019-10-18 13:05:28 +02:00
where
T: Serialize,
2019-10-03 11:49:13 +02:00
{
let text = value.serialize(ConvertToString)?;
self.texts.push(text);
Ok(())
}
fn end(self) -> Result<Self::Ok, Self::Error> {
let texts = self.texts.iter().map(String::as_str);
2019-10-18 13:05:28 +02:00
self.indexer
2020-01-10 18:20:30 +01:00
.index_text_seq(self.document_id, self.pos, texts);
Ok(None)
2019-10-03 11:49:13 +02:00
}
}