use std::{ fs::{self, File}, io::{BufRead, BufReader}, path::Path, str::FromStr, }; use index::{Checked, Unchecked}; use tempfile::TempDir; use time::OffsetDateTime; use uuid::Uuid; use crate::{Error, IndexMetadata, Result, Version}; use super::{DumpReader, IndexReader}; type Metadata = crate::Metadata; pub struct V6Reader { dump: TempDir, instance_uid: Uuid, metadata: Metadata, tasks: BufReader, keys: BufReader, } struct V6IndexReader { metadata: IndexMetadata, documents: BufReader, settings: BufReader, } impl V6Reader { pub fn open(dump: TempDir) -> Result { let meta_file = fs::read(dump.path().join("metadata.json"))?; let instance_uid = fs::read_to_string(dump.path().join("instance_uid.uuid"))?; let instance_uid = Uuid::from_str(&instance_uid)?; Ok(V6Reader { metadata: serde_json::from_reader(&*meta_file)?, instance_uid, tasks: BufReader::new(File::open(dump.path().join("tasks").join("queue.jsonl"))?), keys: BufReader::new(File::open(dump.path().join("keys.jsonl"))?), dump, }) } } impl V6IndexReader { pub fn new(name: String, path: &Path) -> Result { let metadata = File::open(path.join("metadata.json"))?; let ret = V6IndexReader { metadata: serde_json::from_reader(metadata)?, documents: BufReader::new(File::open(path.join("documents.jsonl"))?), settings: BufReader::new(File::open(path.join("settings.json"))?), }; Ok(ret) } } impl DumpReader for V6Reader { type Document = serde_json::Map; type Settings = index::Settings; type Task = index_scheduler::TaskView; type UpdateFile = File; type Key = meilisearch_auth::Key; fn version(&self) -> Version { Version::V6 } fn date(&self) -> Option { Some(self.metadata.dump_date) } fn instance_uid(&self) -> Result> { Ok(Some(self.instance_uid)) } fn indexes( &self, ) -> Result< Box< dyn Iterator< Item = Result< Box< dyn super::IndexReader< Document = Self::Document, Settings = Self::Settings, > + '_, >, >, > + '_, >, > { let entries = fs::read_dir(self.dump.path().join("indexes"))?; Ok(Box::new( entries .map(|entry| -> Result> { let entry = entry?; if entry.file_type()?.is_dir() { let index = Box::new(V6IndexReader::new( entry .file_name() .to_str() .ok_or(Error::BadIndexName)? .to_string(), &entry.path(), )?) as Box< dyn IndexReader< Document = Self::Document, Settings = Self::Settings, >, >; Ok(Some(index)) } else { Ok(None) } }) .filter_map(|entry| entry.transpose()), )) } fn tasks( &mut self, ) -> Box)>> + '_> { Box::new((&mut self.tasks).lines().map(|line| -> Result<_> { let mut task: index_scheduler::TaskView = serde_json::from_str(&line?)?; // TODO: this can be removed once we can `Deserialize` the duration from the `TaskView`. if let Some((started_at, finished_at)) = task.started_at.zip(task.finished_at) { task.duration = Some(finished_at - started_at); } let update_file_path = self .dump .path() .join("tasks") .join("update_files") .join(task.uid.to_string()); if update_file_path.exists() { Ok((task, Some(File::open(update_file_path)?))) } else { Ok((task, None)) } })) } fn keys(&mut self) -> Box> + '_> { Box::new( (&mut self.keys) .lines() .map(|line| -> Result<_> { Ok(serde_json::from_str(&line?)?) }), ) } } impl IndexReader for V6IndexReader { type Document = serde_json::Map; type Settings = index::Settings; fn metadata(&self) -> &IndexMetadata { &self.metadata } fn documents(&mut self) -> Result> + '_>> { Ok(Box::new((&mut self.documents).lines().map( |line| -> Result<_> { Ok(serde_json::from_str(&line?)?) }, ))) } fn settings(&mut self) -> Result { let settings: index::Settings = serde_json::from_reader(&mut self.settings)?; Ok(settings.check()) } }