// MeiliSearch/meilidb-core/src/database.rs
// 181 lines, 6.2 KiB, Rust

use std::collections::hash_map::{HashMap, Entry};
use std::fs::File;
use std::path::Path;
use std::sync::{Arc, RwLock};
use std::{fs, thread};
use zlmdb::{Result as ZResult, CompactionOption};
2019-10-16 17:05:24 +02:00
use zlmdb::types::{Str, Unit};
use crossbeam_channel::Receiver;
use log::{debug, error};
use crate::{store, update, Index, MResult};
2019-10-09 11:45:19 +02:00
/// Boxed, thread-safe callback that receives the [`update::UpdateResult`]
/// of an update once it has been processed by the background worker.
pub type BoxUpdateFn = Box<dyn Fn(update::UpdateResult) + Send + Sync + 'static>;
/// Optional [`BoxUpdateFn`] slot that is swapped in and out through a shared
/// reference (see `set_update_callback` / `unset_update_callback`).
type ArcSwapFn = arc_swap::ArcSwapOption<BoxUpdateFn>;
pub struct Database {
2019-10-16 17:05:24 +02:00
pub env: zlmdb::Env,
common_store: zlmdb::DynDatabase,
indexes_store: zlmdb::Database<Str, Unit>,
2019-10-09 11:45:19 +02:00
indexes: RwLock<HashMap<String, (Index, Arc<ArcSwapFn>, thread::JoinHandle<()>)>>,
}
2019-10-09 11:45:19 +02:00
fn update_awaiter(
receiver: Receiver<()>,
2019-10-16 17:05:24 +02:00
env: zlmdb::Env,
2019-10-09 11:45:19 +02:00
update_fn: Arc<ArcSwapFn>,
index: Index,
) {
for () in receiver {
// consume all updates in order (oldest first)
loop {
2019-10-16 17:05:24 +02:00
let mut writer = match env.write_txn() {
Ok(writer) => writer,
Err(e) => { error!("LMDB writer transaction begin failed: {}", e); break }
};
2019-10-09 17:23:48 +02:00
match update::update_task(&mut writer, index.clone()) {
Ok(Some(status)) => {
if let Err(e) = writer.commit() { error!("update transaction failed: {}", e) }
if let Some(ref callback) = *update_fn.load() {
(callback)(status);
}
},
// no more updates to handle for now
2019-10-09 17:23:48 +02:00
Ok(None) => { debug!("no more updates"); writer.abort(); break },
Err(e) => { error!("update task failed: {}", e); writer.abort() },
}
}
}
}
impl Database {
pub fn open_or_create(path: impl AsRef<Path>) -> MResult<Database> {
fs::create_dir_all(path.as_ref())?;
2019-10-16 17:05:24 +02:00
let env = zlmdb::EnvOpenOptions::new()
.map_size(10 * 1024 * 1024 * 1024) // 10GB
.max_dbs(3000)
.open(path)?;
2019-10-16 17:05:24 +02:00
let common_store = env.create_dyn_database(Some("common"))?;
let indexes_store = env.create_database::<Str, Unit>(Some("indexes"))?;
// list all indexes that needs to be opened
let mut must_open = Vec::new();
2019-10-16 17:05:24 +02:00
let reader = env.read_txn()?;
for result in indexes_store.iter(&reader)? {
let (index_name, _) = result?;
must_open.push(index_name.to_owned());
}
2019-10-16 17:05:24 +02:00
reader.abort();
// open the previously aggregated indexes
let mut indexes = HashMap::new();
for index_name in must_open {
let (sender, receiver) = crossbeam_channel::bounded(100);
2019-10-16 17:05:24 +02:00
let index = match store::open(&env, &index_name, sender.clone())? {
Some(index) => index,
None => {
log::warn!("the index {} doesn't exist or has not all the databases", index_name);
continue;
},
};
2019-10-09 11:45:19 +02:00
let update_fn = Arc::new(ArcSwapFn::empty());
2019-10-16 17:05:24 +02:00
let env_clone = env.clone();
let index_clone = index.clone();
2019-10-09 11:45:19 +02:00
let update_fn_clone = update_fn.clone();
let handle = thread::spawn(move || {
2019-10-16 17:05:24 +02:00
update_awaiter(receiver, env_clone, update_fn_clone, index_clone)
2019-10-09 11:45:19 +02:00
});
// send an update notification to make sure that
2019-10-16 17:05:24 +02:00
// possible pre-boot updates are consumed
sender.send(()).unwrap();
2019-10-09 11:45:19 +02:00
let result = indexes.insert(index_name, (index, update_fn, handle));
assert!(result.is_none(), "The index should not have been already open");
}
2019-10-16 17:05:24 +02:00
Ok(Database { env, common_store, indexes_store, indexes: RwLock::new(indexes) })
}
pub fn open_index(&self, name: impl AsRef<str>) -> Option<Index> {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
Some((index, ..)) => Some(index.clone()),
None => None,
}
}
pub fn create_index(&self, name: impl AsRef<str>) -> MResult<Index> {
let name = name.as_ref();
let mut indexes_lock = self.indexes.write().unwrap();
match indexes_lock.entry(name.to_owned()) {
Entry::Occupied(_) => Err(crate::Error::IndexAlreadyExists),
Entry::Vacant(entry) => {
let (sender, receiver) = crossbeam_channel::bounded(100);
2019-10-16 17:05:24 +02:00
let index = store::create(&self.env, name, sender)?;
2019-10-16 17:05:24 +02:00
let mut writer = self.env.write_txn()?;
self.indexes_store.put(&mut writer, name, &())?;
2019-10-09 11:45:19 +02:00
2019-10-16 17:05:24 +02:00
let env_clone = self.env.clone();
let index_clone = index.clone();
2019-10-09 11:45:19 +02:00
let no_update_fn = Arc::new(ArcSwapFn::empty());
let no_update_fn_clone = no_update_fn.clone();
2019-10-09 11:45:19 +02:00
let handle = thread::spawn(move || {
2019-10-16 17:05:24 +02:00
update_awaiter(receiver, env_clone, no_update_fn_clone, index_clone)
});
writer.commit()?;
entry.insert((index.clone(), no_update_fn, handle));
Ok(index)
}
}
}
pub fn set_update_callback(&self, name: impl AsRef<str>, update_fn: BoxUpdateFn) -> bool {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
Some((_, current_update_fn, _)) => {
let update_fn = Some(Arc::new(update_fn));
current_update_fn.swap(update_fn);
true
},
None => false,
}
}
pub fn unset_update_callback(&self, name: impl AsRef<str>) -> bool {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
Some((_, current_update_fn, _)) => { current_update_fn.swap(None); true },
None => false,
}
}
pub fn copy_and_compact_to_path<P: AsRef<Path>>(&self, path: P) -> ZResult<File> {
self.env.copy_to_path(path, CompactionOption::Enabled)
}
pub fn indexes_names(&self) -> MResult<Vec<String>> {
let indexes = self.indexes.read().unwrap();
Ok(indexes.keys().cloned().collect())
}
2019-10-16 17:05:24 +02:00
pub fn common_store(&self) -> zlmdb::DynDatabase {
2019-10-10 15:14:32 +02:00
self.common_store
}
}