2020-05-19 20:37:13 +08:00
|
|
|
use std::fmt::Write as _;
|
|
|
|
|
|
|
|
use indexmap::IndexMap;
|
|
|
|
use meilisearch_schema::IndexedPos;
|
|
|
|
use meilisearch_types::DocumentId;
|
2020-05-19 20:16:29 +08:00
|
|
|
use ordered_float::OrderedFloat;
|
2020-05-19 20:37:13 +08:00
|
|
|
use serde_json::Value;
|
|
|
|
|
2020-05-19 17:45:46 +08:00
|
|
|
use crate::Number;
|
2020-05-19 20:37:13 +08:00
|
|
|
use crate::raw_indexer::RawIndexer;
|
|
|
|
use crate::serde::SerializerError;
|
2020-05-19 17:45:46 +08:00
|
|
|
use crate::store::DiscoverIds;
|
2020-05-19 20:37:13 +08:00
|
|
|
|
|
|
|
/// Returns the number of words indexed or `None` if the type is unindexable.
|
|
|
|
pub fn index_value(
|
|
|
|
indexer: &mut RawIndexer,
|
|
|
|
document_id: DocumentId,
|
|
|
|
indexed_pos: IndexedPos,
|
|
|
|
value: &Value,
|
|
|
|
) -> Option<usize>
|
|
|
|
{
|
|
|
|
match value {
|
|
|
|
Value::Null => None,
|
|
|
|
Value::Bool(boolean) => {
|
|
|
|
let text = boolean.to_string();
|
|
|
|
let number_of_words = indexer.index_text(document_id, indexed_pos, &text);
|
|
|
|
Some(number_of_words)
|
|
|
|
},
|
|
|
|
Value::Number(number) => {
|
|
|
|
let text = number.to_string();
|
|
|
|
Some(indexer.index_text(document_id, indexed_pos, &text))
|
|
|
|
},
|
|
|
|
Value::String(string) => {
|
|
|
|
Some(indexer.index_text(document_id, indexed_pos, &string))
|
|
|
|
},
|
|
|
|
Value::Array(_) => {
|
|
|
|
let text = value_to_string(value);
|
|
|
|
Some(indexer.index_text(document_id, indexed_pos, &text))
|
|
|
|
},
|
|
|
|
Value::Object(_) => {
|
|
|
|
let text = value_to_string(value);
|
|
|
|
Some(indexer.index_text(document_id, indexed_pos, &text))
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Transforms the JSON Value type into a String.
|
|
|
|
pub fn value_to_string(value: &Value) -> String {
|
|
|
|
fn internal_value_to_string(string: &mut String, value: &Value) {
|
|
|
|
match value {
|
|
|
|
Value::Null => (),
|
|
|
|
Value::Bool(boolean) => { let _ = write!(string, "{}", &boolean); },
|
|
|
|
Value::Number(number) => { let _ = write!(string, "{}", &number); },
|
|
|
|
Value::String(text) => string.push_str(&text),
|
|
|
|
Value::Array(array) => {
|
|
|
|
for value in array {
|
|
|
|
internal_value_to_string(string, value);
|
|
|
|
let _ = string.write_str(". ");
|
|
|
|
}
|
|
|
|
},
|
|
|
|
Value::Object(object) => {
|
|
|
|
for (key, value) in object {
|
|
|
|
string.push_str(key);
|
|
|
|
let _ = string.write_str(". ");
|
|
|
|
internal_value_to_string(string, value);
|
|
|
|
let _ = string.write_str(". ");
|
|
|
|
}
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut string = String::new();
|
|
|
|
internal_value_to_string(&mut string, value);
|
|
|
|
string
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Transforms the JSON Value type into a Number.
|
|
|
|
pub fn value_to_number(value: &Value) -> Option<Number> {
|
|
|
|
use std::str::FromStr;
|
|
|
|
|
|
|
|
match value {
|
|
|
|
Value::Null => None,
|
|
|
|
Value::Bool(boolean) => Some(Number::Unsigned(*boolean as u64)),
|
2020-05-19 20:16:29 +08:00
|
|
|
Value::Number(number) => {
|
|
|
|
match (number.as_i64(), number.as_u64(), number.as_f64()) {
|
|
|
|
(Some(n), _, _) => Some(Number::Signed(n)),
|
|
|
|
(_, Some(n), _) => Some(Number::Unsigned(n)),
|
|
|
|
(_, _, Some(n)) => Some(Number::Float(OrderedFloat(n))),
|
|
|
|
(None, None, None) => None,
|
|
|
|
}
|
|
|
|
},
|
2020-05-19 20:37:13 +08:00
|
|
|
Value::String(string) => Number::from_str(string).ok(),
|
|
|
|
Value::Array(_array) => None,
|
|
|
|
Value::Object(_object) => None,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-05-19 17:45:46 +08:00
|
|
|
/// Validates a string representation to be a correct document id and returns
|
|
|
|
/// the corresponding id or generate a new one, this is the way we produce documents ids.
|
|
|
|
pub fn discover_document_id(
|
|
|
|
userid: &str,
|
|
|
|
user_ids: &fst::Map,
|
|
|
|
available_ids: &mut DiscoverIds<'_>,
|
|
|
|
) -> Result<DocumentId, SerializerError>
|
|
|
|
{
|
|
|
|
if userid.chars().all(|x| x.is_ascii_alphanumeric() || x == '-' || x == '_') {
|
|
|
|
match user_ids.get(userid) {
|
|
|
|
Some(internal_id) => Ok(DocumentId(internal_id)),
|
|
|
|
None => {
|
|
|
|
let internal_id = available_ids.next().expect("no more ids available");
|
|
|
|
Ok(internal_id)
|
|
|
|
},
|
|
|
|
}
|
2020-05-18 21:18:23 +08:00
|
|
|
} else {
|
|
|
|
Err(SerializerError::InvalidDocumentIdFormat)
|
|
|
|
}
|
2020-05-19 20:37:13 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Extracts and validates the document id of a document.
|
2020-05-19 17:45:46 +08:00
|
|
|
pub fn extract_document_id(
|
|
|
|
primary_key: &str,
|
|
|
|
document: &IndexMap<String, Value>,
|
|
|
|
user_ids: &fst::Map,
|
|
|
|
available_ids: &mut DiscoverIds<'_>,
|
|
|
|
) -> Result<(DocumentId, String), SerializerError>
|
|
|
|
{
|
2020-05-19 20:37:13 +08:00
|
|
|
match document.get(primary_key) {
|
|
|
|
Some(value) => {
|
2020-05-19 17:45:46 +08:00
|
|
|
let userid = match value {
|
2020-05-19 20:37:13 +08:00
|
|
|
Value::Number(number) => number.to_string(),
|
|
|
|
Value::String(string) => string.clone(),
|
|
|
|
_ => return Err(SerializerError::InvalidDocumentIdFormat),
|
|
|
|
};
|
2020-05-19 17:45:46 +08:00
|
|
|
discover_document_id(&userid, user_ids, available_ids).map(|id| (id, userid))
|
2020-05-19 20:37:13 +08:00
|
|
|
}
|
|
|
|
None => Err(SerializerError::DocumentIdNotFound),
|
|
|
|
}
|
|
|
|
}
|