mirror of
https://github.com/meilisearch/MeiliSearch
synced 2025-01-11 22:14:32 +01:00
feat: Introduce a little simple http server for demo
This commit is contained in:
parent
4b36fa0739
commit
08d89053da
29
README.md
29
README.md
@ -59,15 +59,34 @@ We have seen much better performances when [using jemalloc as the global allocat
|
||||
|
||||
## Usage and examples
|
||||
|
||||
MeiliDB runs with an index like most search engines.
|
||||
So to test the library you can create one by indexing a simple csv file.
|
||||
You can test a little part of MeiliDB by using this command, it create an index named _movies_ and initialize it with to great Tarantino movies.
|
||||
|
||||
```bash
|
||||
cargo run --release --example create-database -- test.mdb examples/movies/movies.csv --schema examples/movies/schema-movies.toml
|
||||
cargo run --release
|
||||
|
||||
curl -XPOST 'http://127.0.0.1:8000/movies' \
|
||||
-d '
|
||||
identifier = "id"
|
||||
|
||||
[attributes.id]
|
||||
stored = true
|
||||
|
||||
[attributes.title]
|
||||
stored = true
|
||||
indexed = true
|
||||
'
|
||||
|
||||
curl -H 'Content-Type: application/json' \
|
||||
-XPUT 'http://127.0.0.1:8000/movies' \
|
||||
-d '{ "id": 123, "title": "Inglorious Bastards" }'
|
||||
|
||||
curl -H 'Content-Type: application/json' \
|
||||
-XPUT 'http://127.0.0.1:8000/movies' \
|
||||
-d '{ "id": 456, "title": "Django Unchained" }'
|
||||
```
|
||||
|
||||
Once the command is executed, the index should be in the `test.mdb` folder. You are now able to run the `query-database` example and play with MeiliDB.
|
||||
Once the database is initialized you can query it by using the following command:
|
||||
|
||||
```bash
|
||||
cargo run --release --example query-database -- test.mdb -n 10 id title overview release_date
|
||||
curl -XGET 'http://127.0.0.1:8000/movies/search?q=inglo'
|
||||
```
|
||||
|
@ -14,7 +14,7 @@ meilidb-core = { path = "../meilidb-core", version = "0.1.0" }
|
||||
meilidb-tokenizer = { path = "../meilidb-tokenizer", version = "0.1.0" }
|
||||
ordered-float = { version = "1.0.2", features = ["serde"] }
|
||||
sdset = "0.3.1"
|
||||
serde = { version = "1.0.90", features = ["derive"] }
|
||||
serde = { version = "1.0.91", features = ["derive"] }
|
||||
serde_json = { version = "1.0.39", features = ["preserve_order"] }
|
||||
sled = "0.23.0"
|
||||
toml = { version = "0.5.0", features = ["preserve_order"] }
|
||||
|
@ -5,23 +5,19 @@ version = "0.3.1"
|
||||
authors = ["Kerollmops <renault.cle@gmail.com>"]
|
||||
|
||||
[dependencies]
|
||||
meilidb-core = { path = "../meilidb-core", version = "0.1.0" }
|
||||
meilidb-data = { path = "../meilidb-data", version = "0.1.0" }
|
||||
meilidb-tokenizer = { path = "../meilidb-tokenizer", version = "0.1.0" }
|
||||
|
||||
[features]
|
||||
default = []
|
||||
i128 = ["meilidb-core/i128"]
|
||||
nightly = ["meilidb-core/nightly"]
|
||||
serde = { version = "1.0.91" , features = ["derive"] }
|
||||
serde_json = "1.0.39"
|
||||
tempfile = "3.0.7"
|
||||
tide = "0.2.0"
|
||||
|
||||
[dev-dependencies]
|
||||
meilidb-core = { path = "../meilidb-core", version = "0.1.0" }
|
||||
csv = "1.0.7"
|
||||
env_logger = "0.6.1"
|
||||
jemallocator = "0.1.9"
|
||||
quickcheck = "0.8.2"
|
||||
rand = "0.6.5"
|
||||
rand_xorshift = "0.1.1"
|
||||
serde = { version = "1.0.90", features = ["derive"] }
|
||||
structopt = "0.2.15"
|
||||
tempfile = "3.0.7"
|
||||
termcolor = "1.0.4"
|
||||
|
@ -1,26 +0,0 @@
|
||||
use std::io::{self, BufReader, BufRead};
|
||||
use std::collections::HashSet;
|
||||
use std::path::Path;
|
||||
use std::fs::File;
|
||||
|
||||
#[derive(Debug)]
|
||||
pub struct CommonWords(HashSet<String>);
|
||||
|
||||
impl CommonWords {
|
||||
pub fn from_file<P>(path: P) -> io::Result<Self>
|
||||
where P: AsRef<Path>
|
||||
{
|
||||
let file = File::open(path)?;
|
||||
let file = BufReader::new(file);
|
||||
let mut set = HashSet::new();
|
||||
for line in file.lines().filter_map(|l| l.ok()) {
|
||||
let word = line.trim().to_owned();
|
||||
set.insert(word);
|
||||
}
|
||||
Ok(CommonWords(set))
|
||||
}
|
||||
|
||||
pub fn contains(&self, word: &str) -> bool {
|
||||
self.0.contains(word)
|
||||
}
|
||||
}
|
@ -1,7 +0,0 @@
|
||||
#![cfg_attr(feature = "nightly", feature(test))]
|
||||
|
||||
mod common_words;
|
||||
mod sort_by_attr;
|
||||
|
||||
pub use self::sort_by_attr::SortByAttr;
|
||||
pub use self::common_words::CommonWords;
|
74
meilidb/src/main.rs
Normal file
74
meilidb/src/main.rs
Normal file
@ -0,0 +1,74 @@
|
||||
#![feature(async_await)]
|
||||
|
||||
use std::collections::HashMap;
|
||||
|
||||
use serde::{Deserialize, Serialize};
|
||||
use tide::querystring::ExtractQuery;
|
||||
use tide::http::status::StatusCode;
|
||||
use tide::{error::ResultExt, response, App, Context, EndpointResult};
|
||||
use serde_json::Value;
|
||||
use meilidb_data::{Database, Schema};
|
||||
|
||||
#[derive(Debug, Serialize, Deserialize, Clone)]
|
||||
struct SearchQuery {
|
||||
q: String,
|
||||
}
|
||||
|
||||
async fn create_index(mut cx: Context<Database>) -> EndpointResult<()> {
|
||||
let index: String = cx.param("index").client_err()?;
|
||||
let schema = cx.body_bytes().await.client_err()?;
|
||||
let schema = Schema::from_toml(schema.as_slice()).unwrap();
|
||||
|
||||
let database = cx.app_data();
|
||||
database.create_index(&index, schema).unwrap();
|
||||
|
||||
Ok(())
|
||||
}
|
||||
|
||||
async fn update_documents(mut cx: Context<Database>) -> EndpointResult<()> {
|
||||
let index: String = cx.param("index").client_err()?;
|
||||
let document: HashMap<String, Value> = cx.body_json().await.client_err()?;
|
||||
|
||||
let database = cx.app_data();
|
||||
let index = match database.open_index(&index).unwrap() {
|
||||
Some(index) => index,
|
||||
None => Err(StatusCode::NOT_FOUND)?,
|
||||
};
|
||||
|
||||
let mut addition = index.documents_addition();
|
||||
addition.update_document(document).unwrap();
|
||||
addition.finalize().unwrap();
|
||||
|
||||
Ok(())
|
||||
}
|
||||
|
||||
async fn search_index(cx: Context<Database>) -> EndpointResult {
|
||||
let index: String = cx.param("index").client_err()?;
|
||||
let query: SearchQuery = cx.url_query()?;
|
||||
|
||||
let database = cx.app_data();
|
||||
|
||||
let index = match database.open_index(&index).unwrap() {
|
||||
Some(index) => index,
|
||||
None => Err(StatusCode::NOT_FOUND)?,
|
||||
};
|
||||
|
||||
let documents_ids = index.query_builder().query(&query.q, 0..100).unwrap();
|
||||
let documents: Vec<Value> = documents_ids
|
||||
.into_iter()
|
||||
.filter_map(|x| index.document(None, x.id).unwrap())
|
||||
.collect();
|
||||
|
||||
Ok(response::json(documents))
|
||||
}
|
||||
|
||||
fn main() -> std::io::Result<()> {
|
||||
let tmp_dir = tempfile::tempdir().unwrap();
|
||||
let database = Database::start_default(&tmp_dir).unwrap();
|
||||
let mut app = App::new(database);
|
||||
|
||||
app.at("/:index").post(create_index).put(update_documents);
|
||||
app.at("/:index/search").get(search_index);
|
||||
|
||||
app.serve("127.0.0.1:8000")
|
||||
}
|
@ -1,121 +0,0 @@
|
||||
use std::cmp::Ordering;
|
||||
use std::error::Error;
|
||||
use std::fmt;
|
||||
|
||||
use meilidb_core::criterion::Criterion;
|
||||
use meilidb_core::RawDocument;
|
||||
use meilidb_data::{Schema, SchemaAttr, RankedMap};
|
||||
|
||||
/// An helper struct that permit to sort documents by
|
||||
/// some of their stored attributes.
|
||||
///
|
||||
/// # Note
|
||||
///
|
||||
/// If a document cannot be deserialized it will be considered [`None`][].
|
||||
///
|
||||
/// Deserialized documents are compared like `Some(doc0).cmp(&Some(doc1))`,
|
||||
/// so you must check the [`Ord`] of `Option` implementation.
|
||||
///
|
||||
/// [`None`]: https://doc.rust-lang.org/std/option/enum.Option.html#variant.None
|
||||
/// [`Ord`]: https://doc.rust-lang.org/std/option/enum.Option.html#impl-Ord
|
||||
///
|
||||
/// # Example
|
||||
///
|
||||
/// ```ignore
|
||||
/// use serde_derive::Deserialize;
|
||||
/// use meilidb::rank::criterion::*;
|
||||
///
|
||||
/// let custom_ranking = SortByAttr::lower_is_better(&ranked_map, &schema, "published_at")?;
|
||||
///
|
||||
/// let builder = CriteriaBuilder::with_capacity(8)
|
||||
/// .add(SumOfTypos)
|
||||
/// .add(NumberOfWords)
|
||||
/// .add(WordsProximity)
|
||||
/// .add(SumOfWordsAttribute)
|
||||
/// .add(SumOfWordsPosition)
|
||||
/// .add(Exact)
|
||||
/// .add(custom_ranking)
|
||||
/// .add(DocumentId);
|
||||
///
|
||||
/// let criterion = builder.build();
|
||||
///
|
||||
/// ```
|
||||
pub struct SortByAttr<'a> {
|
||||
ranked_map: &'a RankedMap,
|
||||
attr: SchemaAttr,
|
||||
reversed: bool,
|
||||
}
|
||||
|
||||
impl<'a> SortByAttr<'a> {
|
||||
pub fn lower_is_better(
|
||||
ranked_map: &'a RankedMap,
|
||||
schema: &Schema,
|
||||
attr_name: &str,
|
||||
) -> Result<SortByAttr<'a>, SortByAttrError>
|
||||
{
|
||||
SortByAttr::new(ranked_map, schema, attr_name, false)
|
||||
}
|
||||
|
||||
pub fn higher_is_better(
|
||||
ranked_map: &'a RankedMap,
|
||||
schema: &Schema,
|
||||
attr_name: &str,
|
||||
) -> Result<SortByAttr<'a>, SortByAttrError>
|
||||
{
|
||||
SortByAttr::new(ranked_map, schema, attr_name, true)
|
||||
}
|
||||
|
||||
fn new(
|
||||
ranked_map: &'a RankedMap,
|
||||
schema: &Schema,
|
||||
attr_name: &str,
|
||||
reversed: bool,
|
||||
) -> Result<SortByAttr<'a>, SortByAttrError>
|
||||
{
|
||||
let attr = match schema.attribute(attr_name) {
|
||||
Some(attr) => attr,
|
||||
None => return Err(SortByAttrError::AttributeNotFound),
|
||||
};
|
||||
|
||||
if !schema.props(attr).is_ranked() {
|
||||
return Err(SortByAttrError::AttributeNotRegisteredForRanking);
|
||||
}
|
||||
|
||||
Ok(SortByAttr { ranked_map, attr, reversed })
|
||||
}
|
||||
}
|
||||
|
||||
impl<'a> Criterion for SortByAttr<'a> {
|
||||
fn evaluate(&self, lhs: &RawDocument, rhs: &RawDocument) -> Ordering {
|
||||
let lhs = self.ranked_map.get(lhs.id, self.attr);
|
||||
let rhs = self.ranked_map.get(rhs.id, self.attr);
|
||||
|
||||
match (lhs, rhs) {
|
||||
(Some(lhs), Some(rhs)) => {
|
||||
let order = lhs.cmp(&rhs);
|
||||
if self.reversed { order.reverse() } else { order }
|
||||
},
|
||||
(None, Some(_)) => Ordering::Greater,
|
||||
(Some(_), None) => Ordering::Less,
|
||||
(None, None) => Ordering::Equal,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
|
||||
pub enum SortByAttrError {
|
||||
AttributeNotFound,
|
||||
AttributeNotRegisteredForRanking,
|
||||
}
|
||||
|
||||
impl fmt::Display for SortByAttrError {
|
||||
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
||||
use SortByAttrError::*;
|
||||
match self {
|
||||
AttributeNotFound => f.write_str("attribute not found in the schema"),
|
||||
AttributeNotRegisteredForRanking => f.write_str("attribute not registered for ranking"),
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl Error for SortByAttrError { }
|
Loading…
x
Reference in New Issue
Block a user