fix escaped quotes in filter

This commit is contained in:
Tamo 2022-06-09 16:03:49 +02:00
parent 9580b9de79
commit 90afde435b
No known key found for this signature in database
GPG Key ID: 20CD8020AFA88D69
2 changed files with 78 additions and 14 deletions

View File

@ -40,7 +40,6 @@ mod error;
mod value; mod value;
use std::fmt::Debug; use std::fmt::Debug;
use std::ops::Deref;
use std::str::FromStr; use std::str::FromStr;
pub use condition::{parse_condition, parse_to, Condition}; pub use condition::{parse_condition, parse_to, Condition};
@ -70,14 +69,6 @@ pub struct Token<'a> {
value: Option<String>, value: Option<String>,
} }
impl<'a> Deref for Token<'a> {
type Target = &'a str;
fn deref(&self) -> &Self::Target {
&self.span
}
}
impl<'a> PartialEq for Token<'a> { impl<'a> PartialEq for Token<'a> {
fn eq(&self, other: &Self) -> bool { fn eq(&self, other: &Self) -> bool {
self.span.fragment() == other.span.fragment() self.span.fragment() == other.span.fragment()
@ -89,6 +80,10 @@ impl<'a> Token<'a> {
Self { span, value } Self { span, value }
} }
pub fn lexeme(&self) -> &str {
&self.span
}
pub fn value(&self) -> &str { pub fn value(&self) -> &str {
self.value.as_ref().map_or(&self.span, |value| value) self.value.as_ref().map_or(&self.span, |value| value)
} }

View File

@ -1,7 +1,6 @@
use std::collections::HashSet; use std::collections::HashSet;
use std::fmt::{Debug, Display}; use std::fmt::{Debug, Display};
use std::ops::Bound::{self, Excluded, Included}; use std::ops::Bound::{self, Excluded, Included};
use std::ops::Deref;
use either::Either; use either::Either;
pub use filter_parser::{Condition, Error as FPError, FilterCondition, Span, Token}; pub use filter_parser::{Condition, Error as FPError, FilterCondition, Span, Token};
@ -283,8 +282,9 @@ impl<'a> Filter<'a> {
Condition::LowerThanOrEqual(val) => (Included(f64::MIN), Included(val.parse()?)), Condition::LowerThanOrEqual(val) => (Included(f64::MIN), Included(val.parse()?)),
Condition::Between { from, to } => (Included(from.parse()?), Included(to.parse()?)), Condition::Between { from, to } => (Included(from.parse()?), Included(to.parse()?)),
Condition::Equal(val) => { Condition::Equal(val) => {
let (_original_value, string_docids) = let (_original_value, string_docids) = strings_db
strings_db.get(rtxn, &(field_id, &val.to_lowercase()))?.unwrap_or_default(); .get(rtxn, &(field_id, &val.value().to_lowercase()))?
.unwrap_or_default();
let number = val.parse::<f64>().ok(); let number = val.parse::<f64>().ok();
let number_docids = match number { let number_docids = match number {
Some(n) => { Some(n) => {
@ -362,7 +362,7 @@ impl<'a> Filter<'a> {
return Ok(RoaringBitmap::new()); return Ok(RoaringBitmap::new());
} }
} else { } else {
match *fid.deref() { match fid.lexeme() {
attribute @ "_geo" => { attribute @ "_geo" => {
return Err(fid.as_external_error(FilterError::BadGeo(attribute)))?; return Err(fid.as_external_error(FilterError::BadGeo(attribute)))?;
} }
@ -461,7 +461,7 @@ mod tests {
use maplit::hashset; use maplit::hashset;
use super::*; use super::*;
use crate::update::{IndexerConfig, Settings}; use crate::update::{self, IndexDocuments, IndexDocumentsConfig, IndexerConfig, Settings};
use crate::Index; use crate::Index;
#[test] #[test]
@ -598,6 +598,75 @@ mod tests {
)); ));
} }
#[test]
fn escaped_quote_in_filter_value_2380() {
let path = tempfile::tempdir().unwrap();
let mut options = EnvOpenOptions::new();
options.map_size(10 * 1024 * 1024); // 10 MB
let index = Index::new(options, &path).unwrap();
let mut wtxn = index.write_txn().unwrap();
let content = documents!([
{
"id": "test_1",
"monitor_diagonal": "27' to 30'"
},
{
"id": "test_2",
"monitor_diagonal": "27\" to 30\""
},
{
"id": "test_3",
"monitor_diagonal": "27\" to 30'"
},
]);
let config = IndexerConfig::default();
let indexing_config = IndexDocumentsConfig::default();
let mut builder =
IndexDocuments::new(&mut wtxn, &index, &config, indexing_config.clone(), |_| ())
.unwrap();
builder.add_documents(content).unwrap();
builder.execute().unwrap();
wtxn.commit().unwrap();
let mut wtxn = index.write_txn().unwrap();
let mut builder = update::Settings::new(&mut wtxn, &index, &config);
builder.set_filterable_fields(hashset!(S("monitor_diagonal")));
builder.execute(|_| ()).unwrap();
wtxn.commit().unwrap();
let rtxn = index.read_txn().unwrap();
let mut search = crate::Search::new(&rtxn, &index);
// this filter is copy pasted from #2380 with the exact same espace sequence
search.filter(
crate::Filter::from_str("monitor_diagonal = '27\" to 30\\''").unwrap().unwrap(),
);
let crate::SearchResult { documents_ids, .. } = search.execute().unwrap();
assert_eq!(documents_ids, vec![2]);
search.filter(
crate::Filter::from_str(r#"monitor_diagonal = "27' to 30'" "#).unwrap().unwrap(),
);
let crate::SearchResult { documents_ids, .. } = search.execute().unwrap();
assert_eq!(documents_ids, vec![0]);
search.filter(
crate::Filter::from_str(r#"monitor_diagonal = "27\" to 30\"" "#).unwrap().unwrap(),
);
let crate::SearchResult { documents_ids, .. } = search.execute().unwrap();
assert_eq!(documents_ids, vec![1]);
search.filter(
crate::Filter::from_str(r#"monitor_diagonal = "27\" to 30'" "#).unwrap().unwrap(),
);
let crate::SearchResult { documents_ids, .. } = search.execute().unwrap();
assert_eq!(documents_ids, vec![2]);
}
#[test] #[test]
fn geo_radius_error() { fn geo_radius_error() {
let path = tempfile::tempdir().unwrap(); let path = tempfile::tempdir().unwrap();