2018-10-10 16:57:21 +02:00
|
|
|
pub mod criterion;
|
2018-12-07 11:53:17 +01:00
|
|
|
mod query_builder;
|
2018-11-28 17:12:24 +01:00
|
|
|
mod distinct_map;
|
2018-07-07 14:43:29 +02:00
|
|
|
|
2019-01-06 11:11:55 +01:00
|
|
|
use std::slice::Windows;
|
|
|
|
|
|
|
|
use sdset::SetBuf;
|
|
|
|
use group_by::GroupBy;
|
|
|
|
|
2018-09-09 11:13:58 +02:00
|
|
|
use crate::{Match, DocumentId};
|
2018-05-27 15:23:43 +02:00
|
|
|
|
2018-12-29 20:16:29 +01:00
|
|
|
pub use self::query_builder::{FilterFunc, QueryBuilder, DistinctQueryBuilder};
|
2018-05-27 15:23:43 +02:00
|
|
|
|
2018-06-25 22:26:49 +02:00
|
|
|
#[inline]
|
|
|
|
fn match_query_index(a: &Match, b: &Match) -> bool {
|
|
|
|
a.query_index == b.query_index
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug, Clone)]
|
2018-05-27 15:23:43 +02:00
|
|
|
pub struct Document {
|
2018-10-10 16:57:21 +02:00
|
|
|
pub id: DocumentId,
|
2019-01-06 11:11:55 +01:00
|
|
|
pub matches: Matches,
|
2018-05-27 15:23:43 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Document {
|
2019-01-06 11:23:21 +01:00
|
|
|
pub fn new(id: DocumentId, match_: Match) -> Self {
|
2019-01-06 11:11:55 +01:00
|
|
|
let matches = SetBuf::new_unchecked(vec![match_]);
|
2019-01-06 11:23:21 +01:00
|
|
|
Self::from_matches(id, matches)
|
2018-05-27 15:23:43 +02:00
|
|
|
}
|
|
|
|
|
2019-01-06 11:11:55 +01:00
|
|
|
pub fn from_matches(id: DocumentId, matches: SetBuf<Match>) -> Self {
|
2019-01-06 11:23:21 +01:00
|
|
|
let matches = Matches::new(matches);
|
|
|
|
Self { id, matches }
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn from_unsorted_matches(id: DocumentId, matches: Vec<Match>) -> Self {
|
|
|
|
let matches = Matches::from_unsorted(matches);
|
|
|
|
Self { id, matches }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug, Clone)]
|
|
|
|
pub struct Matches {
|
|
|
|
matches: SetBuf<Match>,
|
|
|
|
slices: Vec<usize>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Matches {
|
|
|
|
pub fn new(matches: SetBuf<Match>) -> Matches {
|
2019-01-06 11:11:55 +01:00
|
|
|
let mut last = 0;
|
|
|
|
let mut slices = vec![0];
|
2019-01-06 11:23:21 +01:00
|
|
|
|
2019-01-06 11:11:55 +01:00
|
|
|
for group in GroupBy::new(&matches, match_query_index) {
|
|
|
|
let index = last + group.len();
|
|
|
|
slices.push(index);
|
|
|
|
last = index;
|
|
|
|
}
|
|
|
|
|
2019-01-06 11:23:21 +01:00
|
|
|
Matches { matches, slices }
|
2019-01-06 11:11:55 +01:00
|
|
|
}
|
|
|
|
|
2019-01-06 11:23:21 +01:00
|
|
|
pub fn from_unsorted(mut matches: Vec<Match>) -> Matches {
|
2018-10-21 16:42:19 +02:00
|
|
|
matches.sort_unstable();
|
2019-01-06 11:11:55 +01:00
|
|
|
let matches = SetBuf::new_unchecked(matches);
|
2019-01-06 11:23:21 +01:00
|
|
|
Matches::new(matches)
|
2018-10-21 16:42:19 +02:00
|
|
|
}
|
2019-01-06 11:11:55 +01:00
|
|
|
|
|
|
|
pub fn query_index_groups(&self) -> QueryIndexGroups {
|
|
|
|
QueryIndexGroups {
|
|
|
|
matches: &self.matches,
|
|
|
|
windows: self.slices.windows(2),
|
|
|
|
}
|
2018-05-27 15:23:43 +02:00
|
|
|
}
|
|
|
|
}
|
2019-01-06 11:11:55 +01:00
|
|
|
|
|
|
|
pub struct QueryIndexGroups<'a, 'b> {
|
|
|
|
matches: &'a [Match],
|
|
|
|
windows: Windows<'b, usize>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a, 'b> Iterator for QueryIndexGroups<'a, 'b> {
|
|
|
|
type Item = &'a [Match];
|
|
|
|
|
|
|
|
fn next(&mut self) -> Option<Self::Item> {
|
|
|
|
self.windows.next().map(|range| {
|
|
|
|
match *range {
|
|
|
|
[left, right] => &self.matches[left..right],
|
2019-01-06 11:23:21 +01:00
|
|
|
_ => unreachable!(),
|
2019-01-06 11:11:55 +01:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// impl ExactSizeIterator for QueryIndexGroups<'_, '_> {
|
|
|
|
// fn len(&self) -> usize {
|
|
|
|
// self.windows.len() // FIXME (+1) ?
|
|
|
|
// }
|
|
|
|
// }
|