MeiliSearch/meilisearch-http/src/index_controller/snapshot.rs

269 lines
8.4 KiB
Rust
Raw Normal View History

2021-03-23 16:37:46 +01:00
use std::path::{Path, PathBuf};
2021-03-17 11:53:23 +01:00
use std::time::Duration;
2021-06-21 13:57:32 +02:00
use anyhow::bail;
2021-06-23 10:41:55 +02:00
use log::{error, info, trace};
2021-03-25 14:48:51 +01:00
use tokio::fs;
2021-03-22 16:51:53 +01:00
use tokio::task::spawn_blocking;
2021-03-22 19:19:37 +01:00
use tokio::time::sleep;
2021-03-17 11:53:23 +01:00
use super::update_actor::UpdateActorHandle;
use super::uuid_resolver::UuidResolverHandle;
2021-03-23 16:19:01 +01:00
use crate::helpers::compression;
2021-03-17 11:53:23 +01:00
2021-03-23 11:00:50 +01:00
pub struct SnapshotService<U, R> {
uuid_resolver_handle: R,
update_handle: U,
2021-03-17 11:53:23 +01:00
snapshot_period: Duration,
snapshot_path: PathBuf,
2021-03-25 10:23:31 +01:00
db_name: String,
2021-03-17 11:53:23 +01:00
}
2021-03-23 11:00:50 +01:00
impl<U, R> SnapshotService<U, R>
where
U: UpdateActorHandle,
2021-03-23 16:19:01 +01:00
R: UuidResolverHandle,
2021-03-23 11:00:50 +01:00
{
2021-03-17 11:53:23 +01:00
pub fn new(
2021-03-23 11:00:50 +01:00
uuid_resolver_handle: R,
update_handle: U,
2021-03-17 11:53:23 +01:00
snapshot_period: Duration,
snapshot_path: PathBuf,
2021-03-25 10:23:31 +01:00
db_name: String,
2021-03-17 11:53:23 +01:00
) -> Self {
Self {
uuid_resolver_handle,
update_handle,
snapshot_period,
snapshot_path,
2021-03-25 10:23:31 +01:00
db_name,
2021-03-17 11:53:23 +01:00
}
}
pub async fn run(self) {
2021-03-24 11:29:11 +01:00
info!(
2021-03-25 09:34:29 +01:00
"Snapshot scheduled every {}s.",
2021-03-24 11:29:11 +01:00
self.snapshot_period.as_secs()
);
2021-03-17 11:53:23 +01:00
loop {
2021-03-22 19:19:37 +01:00
if let Err(e) = self.perform_snapshot().await {
2021-06-23 10:41:55 +02:00
error!("Error while performing snapshot: {}", e);
2021-03-22 19:19:37 +01:00
}
2021-03-25 09:34:29 +01:00
sleep(self.snapshot_period).await;
2021-03-17 11:53:23 +01:00
}
}
2021-06-15 17:39:07 +02:00
async fn perform_snapshot(&self) -> anyhow::Result<()> {
2021-06-23 10:41:55 +02:00
trace!("Performing snapshot.");
2021-03-24 11:03:01 +01:00
2021-03-25 10:24:33 +01:00
let snapshot_dir = self.snapshot_path.clone();
fs::create_dir_all(&snapshot_dir).await?;
2021-03-25 14:48:51 +01:00
let temp_snapshot_dir =
spawn_blocking(move || tempfile::tempdir_in(snapshot_dir)).await??;
2021-03-22 16:51:53 +01:00
let temp_snapshot_path = temp_snapshot_dir.path().to_owned();
2021-03-23 16:19:01 +01:00
let uuids = self
.uuid_resolver_handle
.snapshot(temp_snapshot_path.clone())
.await?;
2021-03-22 19:19:37 +01:00
if uuids.is_empty() {
2021-03-23 16:19:01 +01:00
return Ok(());
2021-03-22 19:19:37 +01:00
}
2021-04-14 17:53:12 +02:00
self.update_handle
.snapshot(uuids, temp_snapshot_path.clone())
.await?;
2021-03-25 10:23:31 +01:00
let snapshot_dir = self.snapshot_path.clone();
2021-03-25 14:48:51 +01:00
let snapshot_path = self
.snapshot_path
.join(format!("{}.snapshot", self.db_name));
2021-06-15 17:39:07 +02:00
let snapshot_path = spawn_blocking(move || -> anyhow::Result<PathBuf> {
2021-03-25 10:23:31 +01:00
let temp_snapshot_file = tempfile::NamedTempFile::new_in(snapshot_dir)?;
let temp_snapshot_file_path = temp_snapshot_file.path().to_owned();
2021-03-25 10:24:33 +01:00
compression::to_tar_gz(temp_snapshot_path, temp_snapshot_file_path)?;
2021-03-25 10:23:31 +01:00
temp_snapshot_file.persist(&snapshot_path)?;
Ok(snapshot_path)
2021-03-23 16:19:01 +01:00
})
.await??;
2021-03-22 16:51:53 +01:00
2021-06-23 10:41:55 +02:00
trace!("Created snapshot in {:?}.", snapshot_path);
2021-03-22 19:19:37 +01:00
2021-03-19 20:08:00 +01:00
Ok(())
2021-03-17 11:53:23 +01:00
}
}
2021-03-23 16:19:01 +01:00
2021-03-23 16:37:46 +01:00
pub fn load_snapshot(
db_path: impl AsRef<Path>,
snapshot_path: impl AsRef<Path>,
ignore_snapshot_if_db_exists: bool,
ignore_missing_snapshot: bool,
2021-06-15 17:39:07 +02:00
) -> anyhow::Result<()> {
2021-03-23 16:37:46 +01:00
if !db_path.as_ref().exists() && snapshot_path.as_ref().exists() {
2021-03-25 14:48:51 +01:00
match compression::from_tar_gz(snapshot_path, &db_path) {
Ok(()) => Ok(()),
Err(e) => {
// clean created db folder
std::fs::remove_dir_all(&db_path)?;
Err(e)
}
}
2021-03-23 16:37:46 +01:00
} else if db_path.as_ref().exists() && !ignore_snapshot_if_db_exists {
2021-06-21 13:57:32 +02:00
bail!(
2021-03-23 16:37:46 +01:00
"database already exists at {:?}, try to delete it or rename it",
db_path
.as_ref()
.canonicalize()
2021-03-24 11:50:52 +01:00
.unwrap_or_else(|_| db_path.as_ref().to_owned())
2021-03-23 16:37:46 +01:00
)
} else if !snapshot_path.as_ref().exists() && !ignore_missing_snapshot {
2021-06-21 13:57:32 +02:00
bail!(
2021-03-23 16:37:46 +01:00
"snapshot doesn't exist at {:?}",
snapshot_path
.as_ref()
.canonicalize()
2021-03-24 11:50:52 +01:00
.unwrap_or_else(|_| snapshot_path.as_ref().to_owned())
2021-03-23 16:37:46 +01:00
)
} else {
Ok(())
}
}
2021-03-23 16:19:01 +01:00
#[cfg(test)]
mod test {
2021-04-22 10:14:29 +02:00
use std::iter::FromIterator;
use std::{collections::HashSet, sync::Arc};
2021-04-15 19:54:25 +02:00
2021-03-23 16:37:46 +01:00
use futures::future::{err, ok};
2021-03-23 16:19:01 +01:00
use rand::Rng;
use tokio::time::timeout;
use uuid::Uuid;
use super::*;
2021-04-15 19:54:25 +02:00
use crate::index_controller::index_actor::MockIndexActorHandle;
2021-04-22 10:14:29 +02:00
use crate::index_controller::update_actor::{
2021-06-17 14:38:52 +02:00
error::UpdateActorError, MockUpdateActorHandle, UpdateActorHandleImpl,
};
use crate::index_controller::uuid_resolver::{
error::UuidResolverError, MockUuidResolverHandle,
2021-04-22 10:14:29 +02:00
};
2021-03-23 16:19:01 +01:00
#[actix_rt::test]
async fn test_normal() {
let mut rng = rand::thread_rng();
2021-09-08 12:34:56 +02:00
let uuids_num: usize = rng.gen_range(5..10);
2021-04-22 10:14:29 +02:00
let uuids = (0..uuids_num)
.map(|_| Uuid::new_v4())
.collect::<HashSet<_>>();
2021-03-23 16:19:01 +01:00
let mut uuid_resolver = MockUuidResolverHandle::new();
let uuids_clone = uuids.clone();
uuid_resolver
.expect_snapshot()
.times(1)
.returning(move |_| Box::pin(ok(uuids_clone.clone())));
let uuids_clone = uuids.clone();
2021-04-15 19:54:25 +02:00
let mut index_handle = MockIndexActorHandle::new();
index_handle
2021-03-23 16:19:01 +01:00
.expect_snapshot()
.withf(move |uuid, _path| uuids_clone.contains(uuid))
.times(uuids_num)
2021-04-22 10:14:29 +02:00
.returning(move |_, _| Box::pin(ok(())));
2021-04-15 19:54:25 +02:00
let dir = tempfile::tempdir_in(".").unwrap();
let handle = Arc::new(index_handle);
2021-04-22 10:14:29 +02:00
let update_handle =
UpdateActorHandleImpl::<Vec<u8>>::new(handle.clone(), dir.path(), 4096 * 100).unwrap();
2021-03-23 16:19:01 +01:00
2021-03-25 10:24:33 +01:00
let snapshot_path = tempfile::tempdir_in(".").unwrap();
2021-03-23 16:19:01 +01:00
let snapshot_service = SnapshotService::new(
uuid_resolver,
update_handle,
Duration::from_millis(100),
snapshot_path.path().to_owned(),
2021-03-25 10:24:33 +01:00
"data.ms".to_string(),
2021-03-23 16:19:01 +01:00
);
snapshot_service.perform_snapshot().await.unwrap();
}
#[actix_rt::test]
async fn error_performing_uuid_snapshot() {
let mut uuid_resolver = MockUuidResolverHandle::new();
uuid_resolver
.expect_snapshot()
.times(1)
// abitrary error
2021-05-31 16:03:39 +02:00
.returning(|_| Box::pin(err(UuidResolverError::NameAlreadyExist)));
2021-03-23 16:19:01 +01:00
let update_handle = MockUpdateActorHandle::new();
2021-03-25 10:24:33 +01:00
let snapshot_path = tempfile::tempdir_in(".").unwrap();
2021-03-23 16:19:01 +01:00
let snapshot_service = SnapshotService::new(
uuid_resolver,
update_handle,
Duration::from_millis(100),
snapshot_path.path().to_owned(),
2021-03-25 10:24:33 +01:00
"data.ms".to_string(),
2021-03-23 16:19:01 +01:00
);
assert!(snapshot_service.perform_snapshot().await.is_err());
// Nothing was written to the file
2021-03-25 10:24:33 +01:00
assert!(!snapshot_path.path().join("data.ms.snapshot").exists());
2021-03-23 16:19:01 +01:00
}
#[actix_rt::test]
async fn error_performing_index_snapshot() {
let uuid = Uuid::new_v4();
let mut uuid_resolver = MockUuidResolverHandle::new();
uuid_resolver
.expect_snapshot()
.times(1)
2021-04-22 10:14:29 +02:00
.returning(move |_| Box::pin(ok(HashSet::from_iter(Some(uuid)))));
2021-03-23 16:19:01 +01:00
let mut update_handle = MockUpdateActorHandle::new();
update_handle
.expect_snapshot()
// abitrary error
.returning(|_, _| Box::pin(err(UpdateActorError::UnexistingUpdate(0))));
2021-03-23 16:19:01 +01:00
2021-03-25 10:24:33 +01:00
let snapshot_path = tempfile::tempdir_in(".").unwrap();
2021-03-23 16:19:01 +01:00
let snapshot_service = SnapshotService::new(
uuid_resolver,
update_handle,
Duration::from_millis(100),
snapshot_path.path().to_owned(),
2021-03-25 10:24:33 +01:00
"data.ms".to_string(),
2021-03-23 16:19:01 +01:00
);
assert!(snapshot_service.perform_snapshot().await.is_err());
// Nothing was written to the file
2021-03-25 10:24:33 +01:00
assert!(!snapshot_path.path().join("data.ms.snapshot").exists());
2021-03-23 16:19:01 +01:00
}
#[actix_rt::test]
async fn test_loop() {
let mut uuid_resolver = MockUuidResolverHandle::new();
uuid_resolver
.expect_snapshot()
// we expect the funtion to be called between 2 and 3 time in the given interval.
.times(2..4)
// abitrary error, to short-circuit the function
2021-05-31 16:03:39 +02:00
.returning(move |_| Box::pin(err(UuidResolverError::NameAlreadyExist)));
2021-03-23 16:19:01 +01:00
let update_handle = MockUpdateActorHandle::new();
2021-03-25 10:24:33 +01:00
let snapshot_path = tempfile::tempdir_in(".").unwrap();
2021-03-23 16:19:01 +01:00
let snapshot_service = SnapshotService::new(
uuid_resolver,
update_handle,
Duration::from_millis(100),
snapshot_path.path().to_owned(),
2021-03-25 10:24:33 +01:00
"data.ms".to_string(),
2021-03-23 16:19:01 +01:00
);
let _ = timeout(Duration::from_millis(300), snapshot_service.run()).await;
}
}