mod docs_words; mod documents_fields; mod documents_fields_counts; mod main; mod postings_lists; mod synonyms; mod updates; mod updates_results; pub use self::docs_words::DocsWords; pub use self::documents_fields::{DocumentsFields, DocumentFieldsIter}; pub use self::documents_fields_counts::{DocumentsFieldsCounts, DocumentFieldsCountsIter, DocumentsIdsIter}; pub use self::main::Main; pub use self::postings_lists::PostingsLists; pub use self::synonyms::Synonyms; pub use self::updates::Updates; pub use self::updates_results::UpdatesResults; use std::collections::HashSet; use std::convert::TryFrom; use meilidb_schema::{Schema, SchemaAttr}; use serde::de; use crate::criterion::Criteria; use crate::serde::Deserializer; use crate::{update, query_builder::QueryBuilder, DocumentId, MResult, Error}; fn aligned_to(bytes: &[u8], align: usize) -> bool { (bytes as *const _ as *const () as usize) % align == 0 } fn document_attribute_into_key(document_id: DocumentId, attribute: SchemaAttr) -> [u8; 10] { let document_id_bytes = document_id.0.to_be_bytes(); let attr_bytes = attribute.0.to_be_bytes(); let mut key = [0u8; 10]; key[0..8].copy_from_slice(&document_id_bytes); key[8..10].copy_from_slice(&attr_bytes); key } fn document_attribute_from_key(key: [u8; 10]) -> (DocumentId, SchemaAttr) { let document_id = { let array = TryFrom::try_from(&key[0..8]).unwrap(); DocumentId(u64::from_be_bytes(array)) }; let schema_attr = { let array = TryFrom::try_from(&key[8..8+2]).unwrap(); SchemaAttr(u16::from_be_bytes(array)) }; (document_id, schema_attr) } fn main_name(name: &str) -> String { format!("store-{}", name) } fn postings_lists_name(name: &str) -> String { format!("store-{}-postings-lists", name) } fn documents_fields_name(name: &str) -> String { format!("store-{}-documents-fields", name) } fn documents_fields_counts_name(name: &str) -> String { format!("store-{}-documents-fields-counts", name) } fn synonyms_name(name: &str) -> String { format!("store-{}-synonyms", name) } fn docs_words_name(name: &str) -> String { format!("store-{}-docs-words", name) } fn updates_name(name: &str) -> String { format!("store-{}-updates", name) } fn updates_results_name(name: &str) -> String { format!("store-{}-updates-results", name) } #[derive(Clone)] pub struct Index { pub main: Main, pub postings_lists: PostingsLists, pub documents_fields: DocumentsFields, pub documents_fields_counts: DocumentsFieldsCounts, pub synonyms: Synonyms, pub docs_words: DocsWords, pub updates: Updates, pub updates_results: UpdatesResults, updates_notifier: crossbeam_channel::Sender<()>, } impl Index { pub fn document( &self, reader: &R, attributes: Option<&HashSet<&str>>, document_id: DocumentId, ) -> MResult> { let schema = self.main.schema(reader)?; let schema = schema.ok_or(Error::SchemaMissing)?; let attributes = match attributes { Some(attributes) => attributes.into_iter().map(|name| schema.attribute(name)).collect(), None => None, }; let mut deserializer = Deserializer { document_id, reader, documents_fields: self.documents_fields, schema: &schema, attributes: attributes.as_ref(), }; // TODO: currently we return an error if all document fields are missing, // returning None would have been better Ok(T::deserialize(&mut deserializer).map(Some)?) } pub fn document_attribute( &self, reader: &R, document_id: DocumentId, attribute: SchemaAttr, ) -> MResult> { let bytes = self.documents_fields.document_attribute(reader, document_id, attribute)?; match bytes { Some(bytes) => Ok(Some(serde_json::from_slice(bytes)?)), None => Ok(None), } } pub fn schema_update(&self, writer: &mut rkv::Writer, schema: Schema) -> MResult { let _ = self.updates_notifier.send(()); update::push_schema_update(writer, self.updates, self.updates_results, schema) } pub fn customs_update(&self, writer: &mut rkv::Writer, customs: Vec) -> MResult { let _ = self.updates_notifier.send(()); update::push_customs_update(writer, self.updates, self.updates_results, customs) } pub fn documents_addition(&self) -> update::DocumentsAddition { update::DocumentsAddition::new( self.updates, self.updates_results, self.updates_notifier.clone(), ) } pub fn documents_deletion(&self) -> update::DocumentsDeletion { update::DocumentsDeletion::new( self.updates, self.updates_results, self.updates_notifier.clone(), ) } pub fn synonyms_addition(&self) -> update::SynonymsAddition { update::SynonymsAddition::new( self.updates, self.updates_results, self.updates_notifier.clone(), ) } pub fn synonyms_deletion(&self) -> update::SynonymsDeletion { update::SynonymsDeletion::new( self.updates, self.updates_results, self.updates_notifier.clone(), ) } pub fn update_status( &self, reader: &T, update_id: u64, ) -> MResult { update::update_status( reader, self.updates, self.updates_results, update_id, ) } pub fn query_builder(&self) -> QueryBuilder { QueryBuilder::new(self.main, self.postings_lists, self.synonyms) } pub fn query_builder_with_criteria<'c>(&self, criteria: Criteria<'c>) -> QueryBuilder<'c> { QueryBuilder::with_criteria(self.main, self.postings_lists, self.synonyms, criteria) } } pub fn create( env: &rkv::Rkv, name: &str, updates_notifier: crossbeam_channel::Sender<()>, ) -> Result { open_options(env, name, rkv::StoreOptions::create(), updates_notifier) } pub fn open( env: &rkv::Rkv, name: &str, updates_notifier: crossbeam_channel::Sender<()>, ) -> Result { let mut options = rkv::StoreOptions::default(); options.create = false; open_options(env, name, options, updates_notifier) } fn open_options( env: &rkv::Rkv, name: &str, options: rkv::StoreOptions, updates_notifier: crossbeam_channel::Sender<()>, ) -> Result { // create all the store names let main_name = main_name(name); let postings_lists_name = postings_lists_name(name); let documents_fields_name = documents_fields_name(name); let documents_fields_counts_name = documents_fields_counts_name(name); let synonyms_name = synonyms_name(name); let docs_words_name = docs_words_name(name); let updates_name = updates_name(name); let updates_results_name = updates_results_name(name); // open all the stores let main = env.open_single(main_name.as_str(), options)?; let postings_lists = env.open_single(postings_lists_name.as_str(), options)?; let documents_fields = env.open_single(documents_fields_name.as_str(), options)?; let documents_fields_counts = env.open_single(documents_fields_counts_name.as_str(), options)?; let synonyms = env.open_single(synonyms_name.as_str(), options)?; let docs_words = env.open_single(docs_words_name.as_str(), options)?; let updates = env.open_single(updates_name.as_str(), options)?; let updates_results = env.open_single(updates_results_name.as_str(), options)?; Ok(Index { main: Main { main }, postings_lists: PostingsLists { postings_lists }, documents_fields: DocumentsFields { documents_fields }, documents_fields_counts: DocumentsFieldsCounts { documents_fields_counts }, synonyms: Synonyms { synonyms }, docs_words: DocsWords { docs_words }, updates: Updates { updates }, updates_results: UpdatesResults { updates_results }, updates_notifier, }) }