From ee6a54fe4c81676d1fdbefd4cf274be7a40afc97 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cl=C3=A9ment=20Renault?= Date: Wed, 4 Sep 2019 14:53:16 +0200 Subject: [PATCH 1/4] feat: Replace the linked-hash-map dependency by indexmap --- meilidb-schema/Cargo.toml | 2 +- meilidb-schema/src/lib.rs | 10 +++++----- meilidb/Cargo.toml | 2 +- meilidb/examples/query-database.rs | 4 ++-- 4 files changed, 9 insertions(+), 9 deletions(-) diff --git a/meilidb-schema/Cargo.toml b/meilidb-schema/Cargo.toml index 86f772452..88178bc1d 100644 --- a/meilidb-schema/Cargo.toml +++ b/meilidb-schema/Cargo.toml @@ -6,7 +6,7 @@ edition = "2018" [dependencies] bincode = "1.1.2" -linked-hash-map = { version = "0.5.2", features = ["serde_impl"] } +indexmap = { version = "1.1.0", features = ["serde-1"] } serde = { version = "1.0.91", features = ["derive"] } serde_json = { version = "1.0.39", features = ["preserve_order"] } toml = { version = "0.5.0", features = ["preserve_order"] } diff --git a/meilidb-schema/src/lib.rs b/meilidb-schema/src/lib.rs index 85325a0f2..0963b68ef 100644 --- a/meilidb-schema/src/lib.rs +++ b/meilidb-schema/src/lib.rs @@ -6,7 +6,7 @@ use std::ops::BitOr; use std::sync::Arc; use serde::{Serialize, Deserialize}; -use linked_hash_map::LinkedHashMap; +use indexmap::IndexMap; pub const DISPLAYED: SchemaProps = SchemaProps { displayed: true, indexed: false, ranked: false }; pub const INDEXED: SchemaProps = SchemaProps { displayed: false, indexed: true, ranked: false }; @@ -53,14 +53,14 @@ impl BitOr for SchemaProps { #[derive(Serialize, Deserialize)] pub struct SchemaBuilder { identifier: String, - attributes: LinkedHashMap, + attributes: IndexMap, } impl SchemaBuilder { pub fn with_identifier>(name: S) -> SchemaBuilder { SchemaBuilder { identifier: name.into(), - attributes: LinkedHashMap::new(), + attributes: IndexMap::new(), } } @@ -147,14 +147,14 @@ impl Schema { bincode::serialize_into(writer, &builder) } - fn attributes_ordered(&self) -> LinkedHashMap { + fn attributes_ordered(&self) -> IndexMap { let mut ordered = BTreeMap::new(); for (name, attr) in &self.inner.attrs { let (_, props) = self.inner.props[attr.0 as usize]; ordered.insert(attr.0, (name, props)); } - let mut attributes = LinkedHashMap::with_capacity(ordered.len()); + let mut attributes = IndexMap::with_capacity(ordered.len()); for (_, (name, props)) in ordered { attributes.insert(name.clone(), props); } diff --git a/meilidb/Cargo.toml b/meilidb/Cargo.toml index 0eecba0a1..96b597741 100644 --- a/meilidb/Cargo.toml +++ b/meilidb/Cargo.toml @@ -14,7 +14,7 @@ csv = "1.0.7" diskus = "0.5.0" env_logger = "0.6.1" jemallocator = "0.1.9" -linked-hash-map = "0.5.2" +indexmap = { version = "1.1.0", features = ["serde-1"] } meilidb-core = { path = "../meilidb-core", version = "0.1.0" } quickcheck = "0.8.2" rand = "0.6.5" diff --git a/meilidb/examples/query-database.rs b/meilidb/examples/query-database.rs index c02dbc5bf..9677eead6 100644 --- a/meilidb/examples/query-database.rs +++ b/meilidb/examples/query-database.rs @@ -9,7 +9,7 @@ use std::iter::FromIterator; use std::path::PathBuf; use std::time::{Instant, Duration}; -use linked_hash_map::LinkedHashMap; +use indexmap::IndexMap; use rustyline::{Editor, Config}; use structopt::StructOpt; use termcolor::{Color, ColorChoice, ColorSpec, StandardStream, WriteColor}; @@ -39,7 +39,7 @@ pub struct Opt { pub char_context: usize, } -type Document = LinkedHashMap; +type Document = IndexMap; fn display_highlights(text: &str, ranges: &[usize]) -> io::Result<()> { let mut stdout = StandardStream::stdout(ColorChoice::Always); From ba3ac5ea7bebaa26390b86472abd09101b355665 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cl=C3=A9ment=20Renault?= Date: Mon, 16 Sep 2019 14:13:58 +0200 Subject: [PATCH 2/4] chore: Create an internal Schema::to_builder method --- meilidb-schema/src/lib.rs | 15 ++++++++------- 1 file changed, 8 insertions(+), 7 deletions(-) diff --git a/meilidb-schema/src/lib.rs b/meilidb-schema/src/lib.rs index 0963b68ef..6e974594b 100644 --- a/meilidb-schema/src/lib.rs +++ b/meilidb-schema/src/lib.rs @@ -99,6 +99,12 @@ struct InnerSchema { } impl Schema { + fn to_builder(&self) -> SchemaBuilder { + let identifier = self.inner.identifier.clone(); + let attributes = self.attributes_ordered(); + SchemaBuilder { identifier, attributes } + } + pub fn from_toml(mut reader: R) -> Result> { let mut buffer = Vec::new(); reader.read_to_end(&mut buffer)?; @@ -107,10 +113,7 @@ impl Schema { } pub fn to_toml(&self, mut writer: W) -> Result<(), Box> { - let identifier = self.inner.identifier.clone(); - let attributes = self.attributes_ordered(); - let builder = SchemaBuilder { identifier, attributes }; - + let builder = self.to_builder(); let string = toml::to_string_pretty(&builder)?; writer.write_all(string.as_bytes())?; @@ -125,9 +128,7 @@ impl Schema { } pub fn to_json(&self, mut writer: W) -> Result<(), Box> { - let identifier = self.inner.identifier.clone(); - let attributes = self.attributes_ordered(); - let builder = SchemaBuilder { identifier, attributes }; + let builder = self.to_builder(); let string = serde_json::to_string_pretty(&builder)?; writer.write_all(string.as_bytes())?; From ffc29a319f05e0ca98d7cd8a2536fe71556aa368 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cl=C3=A9ment=20Renault?= Date: Mon, 16 Sep 2019 14:22:59 +0200 Subject: [PATCH 3/4] feat: Implement De/Serialize on schema --- meilidb-schema/src/lib.rs | 17 +++++++++++++++++ 1 file changed, 17 insertions(+) diff --git a/meilidb-schema/src/lib.rs b/meilidb-schema/src/lib.rs index 6e974594b..7e6fcf4b5 100644 --- a/meilidb-schema/src/lib.rs +++ b/meilidb-schema/src/lib.rs @@ -190,6 +190,23 @@ impl Schema { } } +impl Serialize for Schema { + fn serialize(&self, serializer: S) -> Result + where S: serde::ser::Serializer, + { + self.to_builder().serialize(serializer) + } +} + +impl<'de> Deserialize<'de> for Schema { + fn deserialize(deserializer: D) -> Result + where D: serde::de::Deserializer<'de>, + { + let builder = SchemaBuilder::deserialize(deserializer)?; + Ok(builder.build()) + } +} + #[derive(Serialize, Deserialize)] #[derive(Debug, Copy, Clone, PartialOrd, Ord, PartialEq, Eq, Hash)] pub struct SchemaAttr(pub u16); From 35b7b58ff790e696a2324084a8a49eedb80990bd Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cl=C3=A9ment=20Renault?= Date: Mon, 16 Sep 2019 14:48:33 +0200 Subject: [PATCH 4/4] feat: Remove the Schema to/from_toml/json/bin methods --- meilidb-data/src/database/index/main_index.rs | 5 +- meilidb-schema/src/lib.rs | 62 +++---------------- meilidb/Cargo.toml | 3 +- meilidb/examples/create-database.rs | 6 +- 4 files changed, 15 insertions(+), 61 deletions(-) diff --git a/meilidb-data/src/database/index/main_index.rs b/meilidb-data/src/database/index/main_index.rs index 285aba868..b7141c80f 100644 --- a/meilidb-data/src/database/index/main_index.rs +++ b/meilidb-data/src/database/index/main_index.rs @@ -19,7 +19,7 @@ impl MainIndex { pub fn schema(&self) -> Result, Error> { match self.0.get(SCHEMA_KEY)? { Some(bytes) => { - let schema = Schema::read_from_bin(bytes.as_ref())?; + let schema = bincode::deserialize_from(bytes.as_ref())?; Ok(Some(schema)) }, None => Ok(None), @@ -27,8 +27,7 @@ impl MainIndex { } pub fn set_schema(&self, schema: &Schema) -> Result<(), Error> { - let mut bytes = Vec::new(); - schema.write_to_bin(&mut bytes)?; + let bytes = bincode::serialize(schema)?; self.0.insert(SCHEMA_KEY, bytes)?; Ok(()) } diff --git a/meilidb-schema/src/lib.rs b/meilidb-schema/src/lib.rs index 7e6fcf4b5..4655e2f07 100644 --- a/meilidb-schema/src/lib.rs +++ b/meilidb-schema/src/lib.rs @@ -105,49 +105,6 @@ impl Schema { SchemaBuilder { identifier, attributes } } - pub fn from_toml(mut reader: R) -> Result> { - let mut buffer = Vec::new(); - reader.read_to_end(&mut buffer)?; - let builder: SchemaBuilder = toml::from_slice(&buffer)?; - Ok(builder.build()) - } - - pub fn to_toml(&self, mut writer: W) -> Result<(), Box> { - let builder = self.to_builder(); - let string = toml::to_string_pretty(&builder)?; - writer.write_all(string.as_bytes())?; - - Ok(()) - } - - pub fn from_json(mut reader: R) -> Result> { - let mut buffer = Vec::new(); - reader.read_to_end(&mut buffer)?; - let builder: SchemaBuilder = serde_json::from_slice(&buffer)?; - Ok(builder.build()) - } - - pub fn to_json(&self, mut writer: W) -> Result<(), Box> { - let builder = self.to_builder(); - let string = serde_json::to_string_pretty(&builder)?; - writer.write_all(string.as_bytes())?; - - Ok(()) - } - - pub fn read_from_bin(reader: R) -> bincode::Result { - let builder: SchemaBuilder = bincode::deserialize_from(reader)?; - Ok(builder.build()) - } - - pub fn write_to_bin(&self, writer: W) -> bincode::Result<()> { - let identifier = self.inner.identifier.clone(); - let attributes = self.attributes_ordered(); - let builder = SchemaBuilder { identifier, attributes }; - - bincode::serialize_into(writer, &builder) - } - fn attributes_ordered(&self) -> IndexMap { let mut ordered = BTreeMap::new(); for (name, attr) in &self.inner.attrs { @@ -253,9 +210,8 @@ mod tests { let schema = builder.build(); let mut buffer = Vec::new(); - - schema.write_to_bin(&mut buffer)?; - let schema2 = Schema::read_from_bin(buffer.as_slice())?; + bincode::serialize_into(&mut buffer, &schema)?; + let schema2 = bincode::deserialize_from(buffer.as_slice())?; assert_eq!(schema, schema2); @@ -270,10 +226,9 @@ mod tests { builder.new_attribute("gamma", INDEXED); let schema = builder.build(); - let mut buffer = Vec::new(); - schema.to_toml(&mut buffer)?; + let buffer = toml::to_vec(&schema)?; + let schema2 = toml::from_slice(buffer.as_slice())?; - let schema2 = Schema::from_toml(buffer.as_slice())?; assert_eq!(schema, schema2); let data = r#" @@ -289,7 +244,7 @@ mod tests { [attributes."gamma"] indexed = true "#; - let schema2 = Schema::from_toml(data.as_bytes())?; + let schema2 = toml::from_str(data)?; assert_eq!(schema, schema2); Ok(()) @@ -303,10 +258,9 @@ mod tests { builder.new_attribute("gamma", INDEXED); let schema = builder.build(); - let mut buffer = Vec::new(); - schema.to_json(&mut buffer)?; + let buffer = serde_json::to_vec(&schema)?; + let schema2 = serde_json::from_slice(buffer.as_slice())?; - let schema2 = Schema::from_json(buffer.as_slice())?; assert_eq!(schema, schema2); let data = r#" @@ -325,7 +279,7 @@ mod tests { } } }"#; - let schema2 = Schema::from_json(data.as_bytes())?; + let schema2 = serde_json::from_str(data)?; assert_eq!(schema, schema2); Ok(()) diff --git a/meilidb/Cargo.toml b/meilidb/Cargo.toml index 96b597741..c4a4a07e9 100644 --- a/meilidb/Cargo.toml +++ b/meilidb/Cargo.toml @@ -13,8 +13,8 @@ meilidb-schema = { path = "../meilidb-schema", version = "0.1.0" } csv = "1.0.7" diskus = "0.5.0" env_logger = "0.6.1" -jemallocator = "0.1.9" indexmap = { version = "1.1.0", features = ["serde-1"] } +jemallocator = "0.1.9" meilidb-core = { path = "../meilidb-core", version = "0.1.0" } quickcheck = "0.8.2" rand = "0.6.5" @@ -26,3 +26,4 @@ structopt = "0.2.15" sysinfo = "0.8.4" tempfile = "3.0.7" termcolor = "1.0.4" +toml = "0.5.3" diff --git a/meilidb/examples/create-database.rs b/meilidb/examples/create-database.rs index d49979f28..c9326b6c1 100644 --- a/meilidb/examples/create-database.rs +++ b/meilidb/examples/create-database.rs @@ -6,7 +6,7 @@ use std::io::{self, BufRead, BufReader}; use std::path::{Path, PathBuf}; use std::time::Instant; use std::error::Error; -use std::fs::File; +use std::fs::{self, File}; use diskus::Walk; use sysinfo::{SystemExt, ProcessExt}; @@ -181,8 +181,8 @@ fn main() -> Result<(), Box> { let opt = Opt::from_args(); let schema = { - let file = File::open(&opt.schema_path)?; - Schema::from_toml(file)? + let string = fs::read_to_string(&opt.schema_path)?; + toml::from_str(&string)? }; let stop_words = match opt.stop_words {