2022-10-03 18:50:06 +02:00
|
|
|
use std::io::Read;
|
2022-10-03 13:57:18 +02:00
|
|
|
use std::path::Path;
|
|
|
|
use std::{fs::File, io::BufReader};
|
|
|
|
|
|
|
|
use flate2::{bufread::GzDecoder, Compression};
|
2022-10-03 18:50:06 +02:00
|
|
|
use index::{Checked, Settings, Unchecked};
|
2022-10-03 13:57:18 +02:00
|
|
|
use index_scheduler::TaskView;
|
|
|
|
use meilisearch_auth::Key;
|
|
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
|
|
|
|
use tempfile::TempDir;
|
|
|
|
use time::OffsetDateTime;
|
2022-10-03 18:50:06 +02:00
|
|
|
use uuid::Uuid;
|
2022-10-03 13:57:18 +02:00
|
|
|
|
2022-10-04 19:13:30 +02:00
|
|
|
use crate::{IndexMetadata, Result, Version};
|
2022-10-03 13:57:18 +02:00
|
|
|
|
|
|
|
// use self::loaders::{v2, v3, v4, v5};
|
|
|
|
|
|
|
|
// pub mod error;
|
|
|
|
// mod compat;
|
|
|
|
// mod loaders;
|
2022-10-03 16:12:01 +02:00
|
|
|
// mod v1;
|
2022-10-04 19:13:30 +02:00
|
|
|
mod v5;
|
2022-10-03 16:12:01 +02:00
|
|
|
mod v6;
|
2022-10-03 13:57:18 +02:00
|
|
|
|
|
|
|
pub fn open(
|
2022-10-03 18:50:06 +02:00
|
|
|
dump: impl Read,
|
2022-10-03 13:57:18 +02:00
|
|
|
) -> Result<
|
2022-10-03 16:12:01 +02:00
|
|
|
Box<
|
|
|
|
dyn DumpReader<
|
|
|
|
Document = serde_json::Map<String, serde_json::Value>,
|
2022-10-03 18:50:06 +02:00
|
|
|
Settings = Settings<Checked>,
|
2022-10-03 16:12:01 +02:00
|
|
|
Task = TaskView,
|
|
|
|
UpdateFile = File,
|
|
|
|
Key = Key,
|
|
|
|
>,
|
2022-10-03 13:57:18 +02:00
|
|
|
>,
|
|
|
|
> {
|
|
|
|
let path = TempDir::new()?;
|
|
|
|
let mut dump = BufReader::new(dump);
|
|
|
|
let gz = GzDecoder::new(&mut dump);
|
|
|
|
let mut archive = tar::Archive::new(gz);
|
|
|
|
archive.unpack(path.path())?;
|
|
|
|
|
|
|
|
#[derive(Deserialize)]
|
2022-10-03 18:50:06 +02:00
|
|
|
#[serde(rename_all = "camelCase")]
|
2022-10-03 13:57:18 +02:00
|
|
|
struct MetadataVersion {
|
|
|
|
pub dump_version: Version,
|
|
|
|
}
|
|
|
|
let mut meta_file = File::open(path.path().join("metadata.json"))?;
|
|
|
|
let MetadataVersion { dump_version } = serde_json::from_reader(&mut meta_file)?;
|
|
|
|
|
|
|
|
match dump_version {
|
|
|
|
// Version::V1 => Ok(Box::new(v1::Reader::open(path)?)),
|
|
|
|
Version::V1 => todo!(),
|
|
|
|
Version::V2 => todo!(),
|
|
|
|
Version::V3 => todo!(),
|
|
|
|
Version::V4 => todo!(),
|
|
|
|
Version::V5 => todo!(),
|
2022-10-03 16:12:01 +02:00
|
|
|
Version::V6 => {
|
|
|
|
let dump_reader = Box::new(v6::V6Reader::open(path)?)
|
|
|
|
as Box<
|
|
|
|
dyn DumpReader<
|
|
|
|
Document = serde_json::Map<String, serde_json::Value>,
|
2022-10-03 18:50:06 +02:00
|
|
|
Settings = Settings<Checked>,
|
2022-10-03 16:12:01 +02:00
|
|
|
Task = TaskView,
|
|
|
|
UpdateFile = File,
|
|
|
|
Key = Key,
|
|
|
|
>,
|
|
|
|
>;
|
|
|
|
|
|
|
|
Ok(dump_reader)
|
|
|
|
}
|
|
|
|
}
|
2022-10-03 13:57:18 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
pub trait DumpReader {
|
|
|
|
type Document;
|
|
|
|
type Settings;
|
|
|
|
|
|
|
|
type Task;
|
|
|
|
type UpdateFile;
|
|
|
|
|
|
|
|
type Key;
|
|
|
|
|
|
|
|
/// Return the version of the dump.
|
|
|
|
fn version(&self) -> Version;
|
|
|
|
|
2022-10-03 18:50:06 +02:00
|
|
|
/// Return at which date the dump was created if there was one.
|
2022-10-03 16:12:01 +02:00
|
|
|
fn date(&self) -> Option<OffsetDateTime>;
|
2022-10-03 13:57:18 +02:00
|
|
|
|
2022-10-03 18:50:06 +02:00
|
|
|
/// Return the instance-uid if there was one.
|
|
|
|
fn instance_uid(&self) -> Result<Option<Uuid>>;
|
|
|
|
|
2022-10-03 13:57:18 +02:00
|
|
|
/// Return an iterator over each indexes.
|
|
|
|
fn indexes(
|
|
|
|
&self,
|
|
|
|
) -> Result<
|
|
|
|
Box<
|
|
|
|
dyn Iterator<
|
2022-10-04 19:13:30 +02:00
|
|
|
Item = Result<
|
|
|
|
Box<
|
|
|
|
dyn IndexReader<Document = Self::Document, Settings = Self::Settings>
|
|
|
|
+ '_,
|
|
|
|
>,
|
|
|
|
>,
|
|
|
|
> + '_,
|
2022-10-03 13:57:18 +02:00
|
|
|
>,
|
|
|
|
>;
|
|
|
|
|
|
|
|
/// Return all the tasks in the dump with a possible update file.
|
|
|
|
fn tasks(
|
2022-10-03 16:12:01 +02:00
|
|
|
&mut self,
|
|
|
|
) -> Box<dyn Iterator<Item = Result<(Self::Task, Option<Self::UpdateFile>)>> + '_>;
|
2022-10-03 13:57:18 +02:00
|
|
|
|
|
|
|
/// Return all the keys.
|
2022-10-03 16:12:01 +02:00
|
|
|
fn keys(&mut self) -> Box<dyn Iterator<Item = Result<Self::Key>> + '_>;
|
2022-10-03 13:57:18 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
pub trait IndexReader {
|
|
|
|
type Document;
|
|
|
|
type Settings;
|
|
|
|
|
2022-10-04 19:13:30 +02:00
|
|
|
fn metadata(&self) -> &IndexMetadata;
|
2022-10-03 16:12:01 +02:00
|
|
|
fn documents(&mut self) -> Result<Box<dyn Iterator<Item = Result<Self::Document>> + '_>>;
|
|
|
|
fn settings(&mut self) -> Result<Self::Settings>;
|
2022-10-03 13:57:18 +02:00
|
|
|
}
|