2019-10-31 22:00:36 +08:00
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::collections::HashSet;
|
|
|
|
use std::time::Duration;
|
|
|
|
|
|
|
|
use meilidb_core::Index;
|
|
|
|
use rayon::iter::{IntoParallelIterator, ParallelIterator};
|
|
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
use tide::querystring::ContextExt as QSContextExt;
|
|
|
|
use tide::{Context, Response};
|
|
|
|
|
|
|
|
use crate::error::{ResponseError, SResult};
|
|
|
|
use crate::helpers::meilidb::{Error, IndexSearchExt, SearchHit};
|
|
|
|
use crate::helpers::tide::ContextExt;
|
|
|
|
use crate::Data;
|
|
|
|
|
|
|
|
#[derive(Deserialize)]
|
|
|
|
#[serde(rename_all = "camelCase", deny_unknown_fields)]
|
|
|
|
struct SearchQuery {
|
|
|
|
q: String,
|
|
|
|
offset: Option<usize>,
|
|
|
|
limit: Option<usize>,
|
|
|
|
attributes_to_retrieve: Option<String>,
|
|
|
|
attributes_to_search_in: Option<String>,
|
|
|
|
attributes_to_crop: Option<String>,
|
|
|
|
crop_length: Option<usize>,
|
|
|
|
attributes_to_highlight: Option<String>,
|
|
|
|
filters: Option<String>,
|
|
|
|
timeout_ms: Option<u64>,
|
|
|
|
matches: Option<bool>,
|
|
|
|
}
|
|
|
|
|
|
|
|
pub async fn search_with_url_query(ctx: Context<Data>) -> SResult<Response> {
|
|
|
|
// ctx.is_allowed(DocumentsRead)?;
|
|
|
|
|
|
|
|
let index = ctx.index()?;
|
|
|
|
let env = &ctx.state().db.env;
|
|
|
|
let reader = env.read_txn().map_err(ResponseError::internal)?;
|
|
|
|
|
2019-11-15 19:04:46 +08:00
|
|
|
let schema = index
|
|
|
|
.main
|
|
|
|
.schema(&reader)
|
|
|
|
.map_err(ResponseError::internal)?
|
|
|
|
.ok_or(ResponseError::open_index("No Schema found"))?;
|
|
|
|
|
2019-10-31 22:00:36 +08:00
|
|
|
let query: SearchQuery = ctx
|
|
|
|
.url_query()
|
|
|
|
.map_err(|_| ResponseError::bad_request("invalid query parameter"))?;
|
|
|
|
|
|
|
|
let mut search_builder = index.new_search(query.q.clone());
|
|
|
|
|
|
|
|
if let Some(offset) = query.offset {
|
|
|
|
search_builder.offset(offset);
|
|
|
|
}
|
|
|
|
if let Some(limit) = query.limit {
|
|
|
|
search_builder.limit(limit);
|
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(attributes_to_retrieve) = query.attributes_to_retrieve {
|
|
|
|
for attr in attributes_to_retrieve.split(',') {
|
|
|
|
search_builder.add_retrievable_field(attr.to_string());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if let Some(attributes_to_search_in) = query.attributes_to_search_in {
|
|
|
|
for attr in attributes_to_search_in.split(',') {
|
2019-11-13 01:25:33 +08:00
|
|
|
search_builder.add_attribute_to_search_in(attr.to_string());
|
2019-10-31 22:00:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if let Some(attributes_to_crop) = query.attributes_to_crop {
|
|
|
|
let crop_length = query.crop_length.unwrap_or(200);
|
2019-11-15 19:04:46 +08:00
|
|
|
if attributes_to_crop == "*" {
|
|
|
|
let attributes_to_crop = schema
|
|
|
|
.iter()
|
|
|
|
.map(|(attr, ..)| (attr.to_string(), crop_length))
|
|
|
|
.collect();
|
|
|
|
search_builder.attributes_to_crop(attributes_to_crop);
|
|
|
|
} else {
|
|
|
|
let attributes_to_crop = attributes_to_crop
|
|
|
|
.split(',')
|
|
|
|
.map(|r| (r.to_string(), crop_length))
|
|
|
|
.collect();
|
|
|
|
search_builder.attributes_to_crop(attributes_to_crop);
|
|
|
|
}
|
2019-10-31 22:00:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(attributes_to_highlight) = query.attributes_to_highlight {
|
2019-11-15 19:04:46 +08:00
|
|
|
let attributes_to_highlight = if attributes_to_highlight == "*" {
|
|
|
|
schema.iter().map(|(attr, ..)| attr.to_string()).collect()
|
|
|
|
} else {
|
|
|
|
attributes_to_highlight
|
|
|
|
.split(',')
|
|
|
|
.map(ToString::to_string)
|
|
|
|
.collect()
|
|
|
|
};
|
|
|
|
|
2019-10-31 22:00:36 +08:00
|
|
|
search_builder.attributes_to_highlight(attributes_to_highlight);
|
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(filters) = query.filters {
|
|
|
|
search_builder.filters(filters);
|
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(timeout_ms) = query.timeout_ms {
|
|
|
|
search_builder.timeout(Duration::from_millis(timeout_ms));
|
|
|
|
}
|
|
|
|
|
|
|
|
if let Some(matches) = query.matches {
|
|
|
|
if matches {
|
|
|
|
search_builder.get_matches();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let response = match search_builder.search(&reader) {
|
|
|
|
Ok(response) => response,
|
|
|
|
Err(Error::Internal(message)) => return Err(ResponseError::Internal(message)),
|
|
|
|
Err(others) => return Err(ResponseError::bad_request(others)),
|
|
|
|
};
|
|
|
|
|
|
|
|
Ok(tide::response::json(response))
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Clone, Deserialize)]
|
|
|
|
#[serde(rename_all = "camelCase", deny_unknown_fields)]
|
|
|
|
struct SearchMultiBody {
|
|
|
|
indexes: HashSet<String>,
|
|
|
|
query: String,
|
|
|
|
offset: Option<usize>,
|
|
|
|
limit: Option<usize>,
|
|
|
|
attributes_to_retrieve: Option<HashSet<String>>,
|
|
|
|
attributes_to_search_in: Option<HashSet<String>>,
|
|
|
|
attributes_to_crop: Option<HashMap<String, usize>>,
|
|
|
|
attributes_to_highlight: Option<HashSet<String>>,
|
|
|
|
filters: Option<String>,
|
|
|
|
timeout_ms: Option<u64>,
|
|
|
|
matches: Option<bool>,
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug, Clone, Serialize)]
|
|
|
|
#[serde(rename_all = "camelCase")]
|
|
|
|
struct SearchMultiBodyResponse {
|
|
|
|
hits: HashMap<String, Vec<SearchHit>>,
|
|
|
|
offset: usize,
|
|
|
|
hits_per_page: usize,
|
|
|
|
processing_time_ms: usize,
|
|
|
|
query: String,
|
|
|
|
}
|
|
|
|
|
|
|
|
pub async fn search_multi_index(mut ctx: Context<Data>) -> SResult<Response> {
|
|
|
|
// ctx.is_allowed(DocumentsRead)?;
|
|
|
|
let body = ctx
|
|
|
|
.body_json::<SearchMultiBody>()
|
|
|
|
.await
|
|
|
|
.map_err(ResponseError::bad_request)?;
|
|
|
|
|
|
|
|
let mut index_list = body.clone().indexes;
|
|
|
|
|
|
|
|
for index in index_list.clone() {
|
|
|
|
if index == "*" {
|
|
|
|
index_list = ctx
|
|
|
|
.state()
|
|
|
|
.db
|
2019-11-20 00:38:02 +08:00
|
|
|
.indexes_uids()
|
2019-10-31 22:00:36 +08:00
|
|
|
.into_iter()
|
|
|
|
.collect();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut offset = 0;
|
|
|
|
let mut count = 20;
|
|
|
|
|
|
|
|
if let Some(body_offset) = body.offset {
|
|
|
|
if let Some(limit) = body.limit {
|
|
|
|
offset = body_offset;
|
|
|
|
count = limit;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let offset = offset;
|
|
|
|
let count = count;
|
|
|
|
let db = &ctx.state().db;
|
|
|
|
let par_body = body.clone();
|
|
|
|
let responses_per_index: Vec<SResult<_>> = index_list
|
|
|
|
.into_par_iter()
|
2019-11-19 23:15:49 +08:00
|
|
|
.map(move |index_uid| {
|
2019-10-31 22:00:36 +08:00
|
|
|
let index: Index = db
|
2019-11-19 23:15:49 +08:00
|
|
|
.open_index(&index_uid)
|
|
|
|
.ok_or(ResponseError::index_not_found(&index_uid))?;
|
2019-10-31 22:00:36 +08:00
|
|
|
|
|
|
|
let mut search_builder = index.new_search(par_body.query.clone());
|
|
|
|
|
|
|
|
search_builder.offset(offset);
|
|
|
|
search_builder.limit(count);
|
|
|
|
|
|
|
|
if let Some(attributes_to_retrieve) = par_body.attributes_to_retrieve.clone() {
|
|
|
|
search_builder.attributes_to_retrieve(attributes_to_retrieve);
|
|
|
|
}
|
|
|
|
if let Some(attributes_to_search_in) = par_body.attributes_to_search_in.clone() {
|
|
|
|
search_builder.attributes_to_search_in(attributes_to_search_in);
|
|
|
|
}
|
|
|
|
if let Some(attributes_to_crop) = par_body.attributes_to_crop.clone() {
|
|
|
|
search_builder.attributes_to_crop(attributes_to_crop);
|
|
|
|
}
|
|
|
|
if let Some(attributes_to_highlight) = par_body.attributes_to_highlight.clone() {
|
|
|
|
search_builder.attributes_to_highlight(attributes_to_highlight);
|
|
|
|
}
|
|
|
|
if let Some(filters) = par_body.filters.clone() {
|
|
|
|
search_builder.filters(filters);
|
|
|
|
}
|
|
|
|
if let Some(timeout_ms) = par_body.timeout_ms {
|
|
|
|
search_builder.timeout(Duration::from_secs(timeout_ms));
|
|
|
|
}
|
|
|
|
if let Some(matches) = par_body.matches {
|
|
|
|
if matches {
|
|
|
|
search_builder.get_matches();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let env = &db.env;
|
|
|
|
let reader = env.read_txn().map_err(ResponseError::internal)?;
|
|
|
|
|
|
|
|
let response = search_builder
|
|
|
|
.search(&reader)
|
|
|
|
.map_err(ResponseError::internal)?;
|
2019-11-19 23:15:49 +08:00
|
|
|
Ok((index_uid, response))
|
2019-10-31 22:00:36 +08:00
|
|
|
})
|
|
|
|
.collect();
|
|
|
|
|
|
|
|
let mut hits_map = HashMap::new();
|
|
|
|
|
|
|
|
let mut max_query_time = 0;
|
|
|
|
|
|
|
|
for response in responses_per_index {
|
2019-11-19 23:15:49 +08:00
|
|
|
if let Ok((index_uid, response)) = response {
|
2019-10-31 22:00:36 +08:00
|
|
|
if response.processing_time_ms > max_query_time {
|
|
|
|
max_query_time = response.processing_time_ms;
|
|
|
|
}
|
2019-11-19 23:15:49 +08:00
|
|
|
hits_map.insert(index_uid, response.hits);
|
2019-10-31 22:00:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let response = SearchMultiBodyResponse {
|
|
|
|
hits: hits_map,
|
|
|
|
offset,
|
|
|
|
hits_per_page: count,
|
|
|
|
processing_time_ms: max_query_time,
|
|
|
|
query: body.query,
|
|
|
|
};
|
|
|
|
|
|
|
|
Ok(tide::response::json(response))
|
|
|
|
}
|