mirror of
https://github.com/meilisearch/MeiliSearch
synced 2025-01-12 06:24:29 +01:00
feat: Introduce a basic RocksDB based version
This commit is contained in:
parent
3a8da82792
commit
4c973238a1
@ -16,7 +16,7 @@ ordered-float = { version = "1.0.2", features = ["serde"] }
|
|||||||
sdset = "0.3.2"
|
sdset = "0.3.2"
|
||||||
serde = { version = "1.0.91", features = ["derive"] }
|
serde = { version = "1.0.91", features = ["derive"] }
|
||||||
serde_json = { version = "1.0.39", features = ["preserve_order"] }
|
serde_json = { version = "1.0.39", features = ["preserve_order"] }
|
||||||
sled = "0.23.0"
|
rocksdb = "0.12.2"
|
||||||
toml = { version = "0.5.0", features = ["preserve_order"] }
|
toml = { version = "0.5.0", features = ["preserve_order"] }
|
||||||
zerocopy = "0.2.2"
|
zerocopy = "0.2.2"
|
||||||
|
|
||||||
@ -28,9 +28,5 @@ rev = "40b3d48"
|
|||||||
git = "https://github.com/Kerollmops/fst.git"
|
git = "https://github.com/Kerollmops/fst.git"
|
||||||
branch = "arc-byte-slice"
|
branch = "arc-byte-slice"
|
||||||
|
|
||||||
[features]
|
|
||||||
default = []
|
|
||||||
compression = ["sled/compression"]
|
|
||||||
|
|
||||||
[dev-dependencies]
|
[dev-dependencies]
|
||||||
tempfile = "3.0.7"
|
tempfile = "3.0.7"
|
||||||
|
@ -2,12 +2,12 @@ use std::sync::Arc;
|
|||||||
use std::ops::Deref;
|
use std::ops::Deref;
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct CustomSettings(pub Arc<sled::Tree>);
|
pub struct CustomSettings(pub Arc<rocksdb::DB>, pub String);
|
||||||
|
|
||||||
impl Deref for CustomSettings {
|
impl Deref for CustomSettings {
|
||||||
type Target = sled::Tree;
|
type Target = rocksdb::DB;
|
||||||
|
|
||||||
fn deref(&self) -> &sled::Tree {
|
fn deref(&self) -> &Self::Target {
|
||||||
&self.0
|
&self.0
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -3,15 +3,16 @@ use meilidb_core::DocumentId;
|
|||||||
use super::Error;
|
use super::Error;
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct DocsWordsIndex(pub Arc<sled::Tree>);
|
pub struct DocsWordsIndex(pub Arc<rocksdb::DB>, pub String);
|
||||||
|
|
||||||
impl DocsWordsIndex {
|
impl DocsWordsIndex {
|
||||||
pub fn doc_words(&self, id: DocumentId) -> Result<Option<fst::Set>, Error> {
|
pub fn doc_words(&self, id: DocumentId) -> Result<Option<fst::Set>, Error> {
|
||||||
let key = id.0.to_be_bytes();
|
let key = id.0.to_be_bytes();
|
||||||
match self.0.get(key)? {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
match self.0.get_pinned_cf(cf, key)? {
|
||||||
Some(bytes) => {
|
Some(bytes) => {
|
||||||
let len = bytes.len();
|
let len = bytes.len();
|
||||||
let value = bytes.into();
|
let value = Arc::from(bytes.as_ref());
|
||||||
let fst = fst::raw::Fst::from_shared_bytes(value, 0, len)?;
|
let fst = fst::raw::Fst::from_shared_bytes(value, 0, len)?;
|
||||||
Ok(Some(fst::Set::from(fst)))
|
Ok(Some(fst::Set::from(fst)))
|
||||||
},
|
},
|
||||||
@ -21,13 +22,15 @@ impl DocsWordsIndex {
|
|||||||
|
|
||||||
pub fn set_doc_words(&self, id: DocumentId, words: &fst::Set) -> Result<(), Error> {
|
pub fn set_doc_words(&self, id: DocumentId, words: &fst::Set) -> Result<(), Error> {
|
||||||
let key = id.0.to_be_bytes();
|
let key = id.0.to_be_bytes();
|
||||||
self.0.set(key, words.as_fst().as_bytes())?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, key, words.as_fst().as_bytes())?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn del_doc_words(&self, id: DocumentId) -> Result<(), Error> {
|
pub fn del_doc_words(&self, id: DocumentId) -> Result<(), Error> {
|
||||||
let key = id.0.to_be_bytes();
|
let key = id.0.to_be_bytes();
|
||||||
self.0.del(key)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.delete_cf(cf, key)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -2,69 +2,77 @@ use std::sync::Arc;
|
|||||||
use std::convert::TryInto;
|
use std::convert::TryInto;
|
||||||
|
|
||||||
use meilidb_core::DocumentId;
|
use meilidb_core::DocumentId;
|
||||||
use sled::IVec;
|
use rocksdb::DBVector;
|
||||||
|
|
||||||
use crate::document_attr_key::DocumentAttrKey;
|
use crate::document_attr_key::DocumentAttrKey;
|
||||||
use crate::schema::SchemaAttr;
|
use crate::schema::SchemaAttr;
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct DocumentsIndex(pub Arc<sled::Tree>);
|
pub struct DocumentsIndex(pub Arc<rocksdb::DB>, pub String);
|
||||||
|
|
||||||
impl DocumentsIndex {
|
impl DocumentsIndex {
|
||||||
pub fn document_field(&self, id: DocumentId, attr: SchemaAttr) -> sled::Result<Option<IVec>> {
|
pub fn document_field(&self, id: DocumentId, attr: SchemaAttr) -> Result<Option<DBVector>, rocksdb::Error> {
|
||||||
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
||||||
self.0.get(key)
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.get_cf(cf, key)
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn set_document_field(&self, id: DocumentId, attr: SchemaAttr, value: Vec<u8>) -> sled::Result<()> {
|
pub fn set_document_field(&self, id: DocumentId, attr: SchemaAttr, value: Vec<u8>) -> Result<(), rocksdb::Error> {
|
||||||
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
||||||
self.0.set(key, value)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, key, value)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn del_document_field(&self, id: DocumentId, attr: SchemaAttr) -> sled::Result<()> {
|
pub fn del_document_field(&self, id: DocumentId, attr: SchemaAttr) -> Result<(), rocksdb::Error> {
|
||||||
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
let key = DocumentAttrKey::new(id, attr).to_be_bytes();
|
||||||
self.0.del(key)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.delete_cf(cf, key)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn del_all_document_fields(&self, id: DocumentId) -> sled::Result<()> {
|
pub fn del_all_document_fields(&self, id: DocumentId) -> Result<(), rocksdb::Error> {
|
||||||
let start = DocumentAttrKey::new(id, SchemaAttr::min()).to_be_bytes();
|
let start = DocumentAttrKey::new(id, SchemaAttr::min()).to_be_bytes();
|
||||||
let end = DocumentAttrKey::new(id, SchemaAttr::max()).to_be_bytes();
|
let end = DocumentAttrKey::new(id, SchemaAttr::max()).to_be_bytes();
|
||||||
let document_attrs = self.0.range(start..=end).keys();
|
|
||||||
|
|
||||||
for key in document_attrs {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
self.0.del(key?)?;
|
let mut batch = rocksdb::WriteBatch::default();
|
||||||
}
|
batch.delete_range_cf(cf, start, end)?;
|
||||||
|
self.0.write(batch)?;
|
||||||
|
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn document_fields(&self, id: DocumentId) -> DocumentFieldsIter {
|
pub fn document_fields(&self, id: DocumentId) -> DocumentFieldsIter {
|
||||||
let start = DocumentAttrKey::new(id, SchemaAttr::min());
|
let start = DocumentAttrKey::new(id, SchemaAttr::min()).to_be_bytes();
|
||||||
let start = start.to_be_bytes();
|
let end = DocumentAttrKey::new(id, SchemaAttr::max()).to_be_bytes();
|
||||||
|
|
||||||
let end = DocumentAttrKey::new(id, SchemaAttr::max());
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
let end = end.to_be_bytes();
|
let from = rocksdb::IteratorMode::From(&start[..], rocksdb::Direction::Forward);
|
||||||
|
let iter = self.0.iterator_cf(cf, from).unwrap();
|
||||||
|
|
||||||
DocumentFieldsIter(self.0.range(start..=end))
|
DocumentFieldsIter(iter, end.to_vec())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub struct DocumentFieldsIter<'a>(sled::Iter<'a>);
|
pub struct DocumentFieldsIter<'a>(rocksdb::DBIterator<'a>, Vec<u8>);
|
||||||
|
|
||||||
impl<'a> Iterator for DocumentFieldsIter<'a> {
|
impl<'a> Iterator for DocumentFieldsIter<'a> {
|
||||||
type Item = sled::Result<(SchemaAttr, IVec)>;
|
type Item = Result<(SchemaAttr, Box<[u8]>), rocksdb::Error>;
|
||||||
|
|
||||||
fn next(&mut self) -> Option<Self::Item> {
|
fn next(&mut self) -> Option<Self::Item> {
|
||||||
match self.0.next() {
|
match self.0.next() {
|
||||||
Some(Ok((key, value))) => {
|
Some((key, value)) => {
|
||||||
|
|
||||||
|
if key.as_ref() > self.1.as_ref() {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
|
||||||
let slice: &[u8] = key.as_ref();
|
let slice: &[u8] = key.as_ref();
|
||||||
let array = slice.try_into().unwrap();
|
let array = slice.try_into().unwrap();
|
||||||
let key = DocumentAttrKey::from_be_bytes(array);
|
let key = DocumentAttrKey::from_be_bytes(array);
|
||||||
Some(Ok((key.attribute, value)))
|
Some(Ok((key.attribute, value)))
|
||||||
},
|
},
|
||||||
Some(Err(e)) => Some(Err(e)),
|
|
||||||
None => None,
|
None => None,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -7,15 +7,15 @@ pub enum Error {
|
|||||||
SchemaMissing,
|
SchemaMissing,
|
||||||
WordIndexMissing,
|
WordIndexMissing,
|
||||||
MissingDocumentId,
|
MissingDocumentId,
|
||||||
SledError(sled::Error),
|
RocksdbError(rocksdb::Error),
|
||||||
FstError(fst::Error),
|
FstError(fst::Error),
|
||||||
BincodeError(bincode::Error),
|
BincodeError(bincode::Error),
|
||||||
SerializerError(SerializerError),
|
SerializerError(SerializerError),
|
||||||
}
|
}
|
||||||
|
|
||||||
impl From<sled::Error> for Error {
|
impl From<rocksdb::Error> for Error {
|
||||||
fn from(error: sled::Error) -> Error {
|
fn from(error: rocksdb::Error) -> Error {
|
||||||
Error::SledError(error)
|
Error::RocksdbError(error)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -45,7 +45,7 @@ impl fmt::Display for Error {
|
|||||||
SchemaMissing => write!(f, "this index does not have a schema"),
|
SchemaMissing => write!(f, "this index does not have a schema"),
|
||||||
WordIndexMissing => write!(f, "this index does not have a word index"),
|
WordIndexMissing => write!(f, "this index does not have a word index"),
|
||||||
MissingDocumentId => write!(f, "document id is missing"),
|
MissingDocumentId => write!(f, "document id is missing"),
|
||||||
SledError(e) => write!(f, "sled error; {}", e),
|
RocksdbError(e) => write!(f, "RocksDB error; {}", e),
|
||||||
FstError(e) => write!(f, "fst error; {}", e),
|
FstError(e) => write!(f, "fst error; {}", e),
|
||||||
BincodeError(e) => write!(f, "bincode error; {}", e),
|
BincodeError(e) => write!(f, "bincode error; {}", e),
|
||||||
SerializerError(e) => write!(f, "serializer error; {}", e),
|
SerializerError(e) => write!(f, "serializer error; {}", e),
|
||||||
|
@ -6,11 +6,12 @@ use crate::schema::Schema;
|
|||||||
use super::Error;
|
use super::Error;
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct MainIndex(pub Arc<sled::Tree>);
|
pub struct MainIndex(pub Arc<rocksdb::DB>, pub String);
|
||||||
|
|
||||||
impl MainIndex {
|
impl MainIndex {
|
||||||
pub fn schema(&self) -> Result<Option<Schema>, Error> {
|
pub fn schema(&self) -> Result<Option<Schema>, Error> {
|
||||||
match self.0.get("schema")? {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
match self.0.get_cf(cf, "schema")? {
|
||||||
Some(bytes) => {
|
Some(bytes) => {
|
||||||
let schema = Schema::read_from_bin(bytes.as_ref())?;
|
let schema = Schema::read_from_bin(bytes.as_ref())?;
|
||||||
Ok(Some(schema))
|
Ok(Some(schema))
|
||||||
@ -22,15 +23,17 @@ impl MainIndex {
|
|||||||
pub fn set_schema(&self, schema: &Schema) -> Result<(), Error> {
|
pub fn set_schema(&self, schema: &Schema) -> Result<(), Error> {
|
||||||
let mut bytes = Vec::new();
|
let mut bytes = Vec::new();
|
||||||
schema.write_to_bin(&mut bytes)?;
|
schema.write_to_bin(&mut bytes)?;
|
||||||
self.0.set("schema", bytes)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, "schema", bytes)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn words_set(&self) -> Result<Option<fst::Set>, Error> {
|
pub fn words_set(&self) -> Result<Option<fst::Set>, Error> {
|
||||||
match self.0.get("words")? {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
match self.0.get_pinned_cf(cf, "words")? {
|
||||||
Some(bytes) => {
|
Some(bytes) => {
|
||||||
let len = bytes.len();
|
let len = bytes.len();
|
||||||
let value = bytes.into();
|
let value = Arc::from(bytes.as_ref());
|
||||||
let fst = fst::raw::Fst::from_shared_bytes(value, 0, len)?;
|
let fst = fst::raw::Fst::from_shared_bytes(value, 0, len)?;
|
||||||
Ok(Some(fst::Set::from(fst)))
|
Ok(Some(fst::Set::from(fst)))
|
||||||
},
|
},
|
||||||
@ -39,12 +42,14 @@ impl MainIndex {
|
|||||||
}
|
}
|
||||||
|
|
||||||
pub fn set_words_set(&self, value: &fst::Set) -> Result<(), Error> {
|
pub fn set_words_set(&self, value: &fst::Set) -> Result<(), Error> {
|
||||||
self.0.set("words", value.as_fst().as_bytes())?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, "words", value.as_fst().as_bytes())?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn ranked_map(&self) -> Result<Option<RankedMap>, Error> {
|
pub fn ranked_map(&self) -> Result<Option<RankedMap>, Error> {
|
||||||
match self.0.get("ranked-map")? {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
match self.0.get_cf(cf, "ranked-map")? {
|
||||||
Some(bytes) => {
|
Some(bytes) => {
|
||||||
let ranked_map = RankedMap::read_from_bin(bytes.as_ref())?;
|
let ranked_map = RankedMap::read_from_bin(bytes.as_ref())?;
|
||||||
Ok(Some(ranked_map))
|
Ok(Some(ranked_map))
|
||||||
@ -56,7 +61,8 @@ impl MainIndex {
|
|||||||
pub fn set_ranked_map(&self, value: &RankedMap) -> Result<(), Error> {
|
pub fn set_ranked_map(&self, value: &RankedMap) -> Result<(), Error> {
|
||||||
let mut bytes = Vec::new();
|
let mut bytes = Vec::new();
|
||||||
value.write_to_bin(&mut bytes)?;
|
value.write_to_bin(&mut bytes)?;
|
||||||
self.0.set("ranked_map", bytes)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, "ranked_map", bytes)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -31,26 +31,24 @@ use self::words_index::WordsIndex;
|
|||||||
|
|
||||||
pub struct Database {
|
pub struct Database {
|
||||||
cache: RwLock<HashMap<String, Arc<Index>>>,
|
cache: RwLock<HashMap<String, Arc<Index>>>,
|
||||||
inner: sled::Db,
|
inner: Arc<rocksdb::DB>,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Database {
|
impl Database {
|
||||||
pub fn start_default<P: AsRef<Path>>(path: P) -> Result<Database, Error> {
|
pub fn start_default<P: AsRef<Path>>(path: P) -> Result<Database, Error> {
|
||||||
|
let path = path.as_ref();
|
||||||
let cache = RwLock::new(HashMap::new());
|
let cache = RwLock::new(HashMap::new());
|
||||||
let config = sled::ConfigBuilder::new().path(path).print_profile_on_drop(true).build();
|
|
||||||
let inner = sled::Db::start(config)?;
|
|
||||||
Ok(Database { cache, inner })
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn start_with_compression<P: AsRef<Path>>(path: P, factor: i32) -> Result<Database, Error> {
|
let inner = {
|
||||||
let config = sled::ConfigBuilder::default()
|
let options = {
|
||||||
.use_compression(true)
|
let mut options = rocksdb::Options::default();
|
||||||
.compression_factor(factor)
|
options.create_if_missing(true);
|
||||||
.path(path)
|
options
|
||||||
.build();
|
};
|
||||||
|
let cfs = rocksdb::DB::list_cf(&options, path).unwrap_or(Vec::new());
|
||||||
|
Arc::new(rocksdb::DB::open_cf(&options, path, cfs)?)
|
||||||
|
};
|
||||||
|
|
||||||
let cache = RwLock::new(HashMap::new());
|
|
||||||
let inner = sled::Db::start(config)?;
|
|
||||||
Ok(Database { cache, inner })
|
Ok(Database { cache, inner })
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -66,7 +64,7 @@ impl Database {
|
|||||||
|
|
||||||
fn set_indexes(&self, value: &HashSet<String>) -> Result<(), Error> {
|
fn set_indexes(&self, value: &HashSet<String>) -> Result<(), Error> {
|
||||||
let bytes = bincode::serialize(value)?;
|
let bytes = bincode::serialize(value)?;
|
||||||
self.inner.set("indexes", bytes)?;
|
self.inner.put("indexes", bytes)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -89,32 +87,32 @@ impl Database {
|
|||||||
}
|
}
|
||||||
|
|
||||||
let main = {
|
let main = {
|
||||||
let tree = self.inner.open_tree(name)?;
|
self.inner.cf_handle(name).expect("cf not found");
|
||||||
MainIndex(tree)
|
MainIndex(self.inner.clone(), name.to_owned())
|
||||||
};
|
};
|
||||||
|
|
||||||
let words = {
|
let words = {
|
||||||
let tree_name = format!("{}-words", name);
|
let cf_name = format!("{}-words", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.cf_handle(&cf_name).expect("cf not found");
|
||||||
WordsIndex(tree)
|
WordsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let docs_words = {
|
let docs_words = {
|
||||||
let tree_name = format!("{}-docs-words", name);
|
let cf_name = format!("{}-docs-words", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.cf_handle(&cf_name).expect("cf not found");
|
||||||
DocsWordsIndex(tree)
|
DocsWordsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let documents = {
|
let documents = {
|
||||||
let tree_name = format!("{}-documents", name);
|
let cf_name = format!("{}-documents", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.cf_handle(&cf_name).expect("cf not found");
|
||||||
DocumentsIndex(tree)
|
DocumentsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let custom = {
|
let custom = {
|
||||||
let tree_name = format!("{}-custom", name);
|
let cf_name = format!("{}-custom", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.cf_handle(&cf_name).expect("cf not found");
|
||||||
CustomSettings(tree)
|
CustomSettings(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let raw_index = RawIndex { main, words, docs_words, documents, custom };
|
let raw_index = RawIndex { main, words, docs_words, documents, custom };
|
||||||
@ -136,8 +134,8 @@ impl Database {
|
|||||||
},
|
},
|
||||||
Entry::Vacant(vacant) => {
|
Entry::Vacant(vacant) => {
|
||||||
let main = {
|
let main = {
|
||||||
let tree = self.inner.open_tree(name)?;
|
self.inner.create_cf(name, &rocksdb::Options::default())?;
|
||||||
MainIndex(tree)
|
MainIndex(self.inner.clone(), name.to_owned())
|
||||||
};
|
};
|
||||||
|
|
||||||
if let Some(prev_schema) = main.schema()? {
|
if let Some(prev_schema) = main.schema()? {
|
||||||
@ -149,27 +147,27 @@ impl Database {
|
|||||||
main.set_schema(&schema)?;
|
main.set_schema(&schema)?;
|
||||||
|
|
||||||
let words = {
|
let words = {
|
||||||
let tree_name = format!("{}-words", name);
|
let cf_name = format!("{}-words", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.create_cf(&cf_name, &rocksdb::Options::default())?;
|
||||||
WordsIndex(tree)
|
WordsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let docs_words = {
|
let docs_words = {
|
||||||
let tree_name = format!("{}-docs-words", name);
|
let cf_name = format!("{}-docs-words", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.create_cf(&cf_name, &rocksdb::Options::default())?;
|
||||||
DocsWordsIndex(tree)
|
DocsWordsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let documents = {
|
let documents = {
|
||||||
let tree_name = format!("{}-documents", name);
|
let cf_name = format!("{}-documents", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.create_cf(&cf_name, &rocksdb::Options::default())?;
|
||||||
DocumentsIndex(tree)
|
DocumentsIndex(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let custom = {
|
let custom = {
|
||||||
let tree_name = format!("{}-custom", name);
|
let cf_name = format!("{}-custom", name);
|
||||||
let tree = self.inner.open_tree(tree_name)?;
|
self.inner.create_cf(&cf_name, &rocksdb::Options::default())?;
|
||||||
CustomSettings(tree)
|
CustomSettings(self.inner.clone(), cf_name)
|
||||||
};
|
};
|
||||||
|
|
||||||
let mut indexes = self.indexes()?.unwrap_or_else(HashSet::new);
|
let mut indexes = self.indexes()?.unwrap_or_else(HashSet::new);
|
||||||
|
@ -5,11 +5,12 @@ use sdset::{Set, SetBuf};
|
|||||||
use zerocopy::{LayoutVerified, AsBytes};
|
use zerocopy::{LayoutVerified, AsBytes};
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct WordsIndex(pub Arc<sled::Tree>);
|
pub struct WordsIndex(pub Arc<rocksdb::DB>, pub String);
|
||||||
|
|
||||||
impl WordsIndex {
|
impl WordsIndex {
|
||||||
pub fn doc_indexes(&self, word: &[u8]) -> sled::Result<Option<SetBuf<DocIndex>>> {
|
pub fn doc_indexes(&self, word: &[u8]) -> Result<Option<SetBuf<DocIndex>>, rocksdb::Error> {
|
||||||
match self.0.get(word)? {
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
match self.0.get_cf(cf, word)? {
|
||||||
Some(bytes) => {
|
Some(bytes) => {
|
||||||
let layout = LayoutVerified::new_slice(bytes.as_ref()).expect("invalid layout");
|
let layout = LayoutVerified::new_slice(bytes.as_ref()).expect("invalid layout");
|
||||||
let slice = layout.into_slice();
|
let slice = layout.into_slice();
|
||||||
@ -20,13 +21,15 @@ impl WordsIndex {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn set_doc_indexes(&self, word: &[u8], set: &Set<DocIndex>) -> sled::Result<()> {
|
pub fn set_doc_indexes(&self, word: &[u8], set: &Set<DocIndex>) -> Result<(), rocksdb::Error> {
|
||||||
self.0.set(word, set.as_bytes())?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.put_cf(cf, word, set.as_bytes())?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn del_doc_indexes(&self, word: &[u8]) -> sled::Result<()> {
|
pub fn del_doc_indexes(&self, word: &[u8]) -> Result<(), rocksdb::Error> {
|
||||||
self.0.del(word)?;
|
let cf = self.0.cf_handle(&self.1).unwrap();
|
||||||
|
self.0.delete_cf(cf, word)?;
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -6,7 +6,7 @@ mod ranked_map;
|
|||||||
mod serde;
|
mod serde;
|
||||||
pub mod schema;
|
pub mod schema;
|
||||||
|
|
||||||
pub use sled;
|
pub use rocksdb;
|
||||||
pub use self::database::{Database, Index, CustomSettings};
|
pub use self::database::{Database, Index, CustomSettings};
|
||||||
pub use self::number::Number;
|
pub use self::number::Number;
|
||||||
pub use self::ranked_map::RankedMap;
|
pub use self::ranked_map::RankedMap;
|
||||||
|
@ -36,7 +36,7 @@ use crate::schema::SchemaAttr;
|
|||||||
pub enum SerializerError {
|
pub enum SerializerError {
|
||||||
DocumentIdNotFound,
|
DocumentIdNotFound,
|
||||||
RmpError(RmpError),
|
RmpError(RmpError),
|
||||||
SledError(sled::Error),
|
RocksdbError(rocksdb::Error),
|
||||||
ParseNumberError(ParseNumberError),
|
ParseNumberError(ParseNumberError),
|
||||||
UnserializableType { type_name: &'static str },
|
UnserializableType { type_name: &'static str },
|
||||||
UnindexableType { type_name: &'static str },
|
UnindexableType { type_name: &'static str },
|
||||||
@ -57,7 +57,7 @@ impl fmt::Display for SerializerError {
|
|||||||
write!(f, "serialized document does not have an id according to the schema")
|
write!(f, "serialized document does not have an id according to the schema")
|
||||||
}
|
}
|
||||||
SerializerError::RmpError(e) => write!(f, "rmp serde related error: {}", e),
|
SerializerError::RmpError(e) => write!(f, "rmp serde related error: {}", e),
|
||||||
SerializerError::SledError(e) => write!(f, "sled related error: {}", e),
|
SerializerError::RocksdbError(e) => write!(f, "RocksDB related error: {}", e),
|
||||||
SerializerError::ParseNumberError(e) => {
|
SerializerError::ParseNumberError(e) => {
|
||||||
write!(f, "error while trying to parse a number: {}", e)
|
write!(f, "error while trying to parse a number: {}", e)
|
||||||
},
|
},
|
||||||
@ -89,9 +89,9 @@ impl From<RmpError> for SerializerError {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl From<sled::Error> for SerializerError {
|
impl From<rocksdb::Error> for SerializerError {
|
||||||
fn from(error: sled::Error) -> SerializerError {
|
fn from(error: rocksdb::Error) -> SerializerError {
|
||||||
SerializerError::SledError(error)
|
SerializerError::RocksdbError(error)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -59,7 +59,7 @@ fn index(
|
|||||||
|
|
||||||
let mut system = sysinfo::System::new();
|
let mut system = sysinfo::System::new();
|
||||||
|
|
||||||
let index = database.create_index("default", schema.clone())?;
|
let index = database.create_index("test", schema.clone())?;
|
||||||
|
|
||||||
let mut rdr = csv::Reader::from_path(csv_data_path)?;
|
let mut rdr = csv::Reader::from_path(csv_data_path)?;
|
||||||
let mut raw_record = csv::StringRecord::new();
|
let mut raw_record = csv::StringRecord::new();
|
||||||
|
@ -143,7 +143,7 @@ fn main() -> Result<(), Box<Error>> {
|
|||||||
let mut buffer = String::new();
|
let mut buffer = String::new();
|
||||||
let input = io::stdin();
|
let input = io::stdin();
|
||||||
|
|
||||||
let index = database.open_index("default")?.unwrap();
|
let index = database.open_index("test")?.unwrap();
|
||||||
let schema = index.schema();
|
let schema = index.schema();
|
||||||
|
|
||||||
println!("database prepared for you in {:.2?}", start.elapsed());
|
println!("database prepared for you in {:.2?}", start.elapsed());
|
||||||
|
Loading…
x
Reference in New Issue
Block a user