meilisearch/milli/src/criterion.rs

83 lines
2.9 KiB
Rust
Raw Normal View History

use std::collections::HashMap;
use std::fmt;
2020-11-27 19:14:56 +08:00
2020-12-04 19:02:22 +08:00
use anyhow::{Context, bail};
use regex::Regex;
2020-11-27 19:14:56 +08:00
use serde::{Serialize, Deserialize};
use once_cell::sync::Lazy;
2020-11-27 19:14:56 +08:00
use crate::facet::FacetType;
/// Matches a custom ascending/descending criterion such as `asc(price)` or
/// `desc(release-date)`.
///
/// Capture group 1 is the order (`asc` or `desc`) and capture group 2 is the
/// field name. The pattern is anchored on both ends so the whole input has to
/// be exactly one criterion: inputs that merely *contain* something looking
/// like `asc(field)` are rejected instead of being silently accepted.
static ASC_DESC_REGEX: Lazy<Regex> = Lazy::new(|| {
    Regex::new(r#"^(asc|desc)\(([\w_-]+)\)$"#)
        .expect("ASC_DESC_REGEX is a constant, valid pattern")
});
#[derive(Debug, Serialize, Deserialize, Clone, PartialEq, Eq)]
2020-08-12 16:43:02 +08:00
pub enum Criterion {
/// Sorted by decreasing number of matched query terms.
/// Query words at the front of an attribute is considered better than if it was at the back.
2020-08-12 16:43:02 +08:00
Words,
/// Sorted by increasing number of typos.
Typo,
2020-08-12 16:43:02 +08:00
/// Sorted by increasing distance between matched query terms.
Proximity,
/// Documents with quey words contained in more important
/// attributes are considred better.
Attribute,
/// Sorted by the similarity of the matched words with the query words.
Exactness,
/// Sorted by the increasing value of the field specified.
Asc(String),
2020-08-12 16:43:02 +08:00
/// Sorted by the decreasing value of the field specified.
Desc(String),
2020-08-12 16:43:02 +08:00
}
2020-12-04 19:02:22 +08:00
impl Criterion {
pub fn from_str(faceted_attributes: &HashMap<String, FacetType>, txt: &str) -> anyhow::Result<Criterion> {
2020-12-04 19:02:22 +08:00
match txt {
"words" => Ok(Criterion::Words),
"typo" => Ok(Criterion::Typo),
2020-12-04 19:02:22 +08:00
"proximity" => Ok(Criterion::Proximity),
"attribute" => Ok(Criterion::Attribute),
"exactness" => Ok(Criterion::Exactness),
text => {
let caps = ASC_DESC_REGEX.captures(text).with_context(|| format!("unknown criterion name: {}", text))?;
2020-12-04 19:02:22 +08:00
let order = caps.get(1).unwrap().as_str();
let field_name = caps.get(2).unwrap().as_str();
faceted_attributes.get(field_name).with_context(|| format!("Can't use {:?} as a criterion as it isn't a faceted field.", field_name))?;
2020-12-04 19:02:22 +08:00
match order {
"asc" => Ok(Criterion::Asc(field_name.to_string())),
"desc" => Ok(Criterion::Desc(field_name.to_string())),
2020-12-04 19:02:22 +08:00
otherwise => bail!("unknown criterion name: {}", otherwise),
}
},
}
}
}
2020-08-12 16:43:02 +08:00
pub fn default_criteria() -> Vec<Criterion> {
vec![
Criterion::Words,
Criterion::Typo,
2020-08-12 16:43:02 +08:00
Criterion::Proximity,
Criterion::Attribute,
Criterion::Exactness,
]
}
impl fmt::Display for Criterion {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
use Criterion::*;
match self {
Words => f.write_str("words"),
Typo => f.write_str("typo"),
Proximity => f.write_str("proximity"),
Attribute => f.write_str("attribute"),
Exactness => f.write_str("exactness"),
2021-03-08 19:09:09 +08:00
Asc(attr) => write!(f, "asc({})", attr),
Desc(attr) => write!(f, "desc({})", attr),
}
}
}