meilisearch/meilidb-core/src/database.rs

201 lines
6.6 KiB
Rust
Raw Normal View History

2019-10-18 19:05:28 +08:00
use std::collections::hash_map::{Entry, HashMap};
use std::fs::File;
use std::path::Path;
use std::sync::{Arc, RwLock};
use std::{fs, thread};
use crossbeam_channel::Receiver;
2019-10-21 18:05:53 +08:00
use heed::types::{Str, Unit};
use heed::{CompactionOption, Result as ZResult};
use log::{debug, error};
use crate::{store, update, Index, MResult};
2019-10-09 17:45:19 +08:00
/// Boxed callback that receives the [`update::UpdateResult`] of a processed update.
///
/// The `Send + Sync + 'static` bounds are required because the callback is
/// shared with, and invoked from, the thread running `update_awaiter`.
pub type BoxUpdateFn = Box<dyn Fn(update::UpdateResult) + Send + Sync + 'static>;
// Optional update callback that can be swapped at runtime; it is replaced by
// `set_update_callback` and cleared by `unset_update_callback`.
type ArcSwapFn = arc_swap::ArcSwapOption<BoxUpdateFn>;
pub struct Database {
2019-10-21 18:05:53 +08:00
pub env: heed::Env,
common_store: heed::PolyDatabase,
indexes_store: heed::Database<Str, Unit>,
2019-10-09 17:45:19 +08:00
indexes: RwLock<HashMap<String, (Index, Arc<ArcSwapFn>, thread::JoinHandle<()>)>>,
}
2019-10-21 18:05:53 +08:00
fn update_awaiter(receiver: Receiver<()>, env: heed::Env, update_fn: Arc<ArcSwapFn>, index: Index) {
for () in receiver {
// consume all updates in order (oldest first)
loop {
2019-10-16 23:05:24 +08:00
let mut writer = match env.write_txn() {
Ok(writer) => writer,
2019-10-18 19:05:28 +08:00
Err(e) => {
error!("LMDB writer transaction begin failed: {}", e);
break;
}
};
2019-10-09 23:23:48 +08:00
match update::update_task(&mut writer, index.clone()) {
Ok(Some(status)) => {
2019-10-18 19:05:28 +08:00
if let Err(e) = writer.commit() {
error!("update transaction failed: {}", e)
}
2019-10-09 23:23:48 +08:00
if let Some(ref callback) = *update_fn.load() {
(callback)(status);
}
2019-10-18 19:05:28 +08:00
}
// no more updates to handle for now
2019-10-18 19:05:28 +08:00
Ok(None) => {
debug!("no more updates");
writer.abort();
break;
}
Err(e) => {
error!("update task failed: {}", e);
writer.abort()
}
}
}
}
}
impl Database {
pub fn open_or_create(path: impl AsRef<Path>) -> MResult<Database> {
fs::create_dir_all(path.as_ref())?;
2019-10-21 18:05:53 +08:00
let env = heed::EnvOpenOptions::new()
2019-10-16 23:05:24 +08:00
.map_size(10 * 1024 * 1024 * 1024) // 10GB
.max_dbs(3000)
.open(path)?;
2019-10-16 23:05:24 +08:00
let common_store = env.create_dyn_database(Some("common"))?;
let indexes_store = env.create_database::<Str, Unit>(Some("indexes"))?;
// list all indexes that needs to be opened
let mut must_open = Vec::new();
2019-10-16 23:05:24 +08:00
let reader = env.read_txn()?;
for result in indexes_store.iter(&reader)? {
let (index_name, _) = result?;
must_open.push(index_name.to_owned());
}
2019-10-16 23:05:24 +08:00
reader.abort();
// open the previously aggregated indexes
let mut indexes = HashMap::new();
for index_name in must_open {
let (sender, receiver) = crossbeam_channel::bounded(100);
2019-10-16 23:05:24 +08:00
let index = match store::open(&env, &index_name, sender.clone())? {
Some(index) => index,
None => {
2019-10-18 19:05:28 +08:00
log::warn!(
"the index {} doesn't exist or has not all the databases",
index_name
);
2019-10-16 23:05:24 +08:00
continue;
2019-10-18 19:05:28 +08:00
}
2019-10-16 23:05:24 +08:00
};
2019-10-09 17:45:19 +08:00
let update_fn = Arc::new(ArcSwapFn::empty());
2019-10-16 23:05:24 +08:00
let env_clone = env.clone();
let index_clone = index.clone();
2019-10-09 17:45:19 +08:00
let update_fn_clone = update_fn.clone();
let handle = thread::spawn(move || {
2019-10-16 23:05:24 +08:00
update_awaiter(receiver, env_clone, update_fn_clone, index_clone)
2019-10-09 17:45:19 +08:00
});
// send an update notification to make sure that
2019-10-16 23:05:24 +08:00
// possible pre-boot updates are consumed
sender.send(()).unwrap();
2019-10-09 17:45:19 +08:00
let result = indexes.insert(index_name, (index, update_fn, handle));
2019-10-18 19:05:28 +08:00
assert!(
result.is_none(),
"The index should not have been already open"
);
}
2019-10-18 19:05:28 +08:00
Ok(Database {
env,
common_store,
indexes_store,
indexes: RwLock::new(indexes),
})
}
pub fn open_index(&self, name: impl AsRef<str>) -> Option<Index> {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
Some((index, ..)) => Some(index.clone()),
None => None,
}
}
pub fn create_index(&self, name: impl AsRef<str>) -> MResult<Index> {
let name = name.as_ref();
let mut indexes_lock = self.indexes.write().unwrap();
match indexes_lock.entry(name.to_owned()) {
Entry::Occupied(_) => Err(crate::Error::IndexAlreadyExists),
Entry::Vacant(entry) => {
let (sender, receiver) = crossbeam_channel::bounded(100);
2019-10-16 23:05:24 +08:00
let index = store::create(&self.env, name, sender)?;
2019-10-16 23:05:24 +08:00
let mut writer = self.env.write_txn()?;
self.indexes_store.put(&mut writer, name, &())?;
2019-10-09 17:45:19 +08:00
2019-10-16 23:05:24 +08:00
let env_clone = self.env.clone();
let index_clone = index.clone();
2019-10-09 17:45:19 +08:00
let no_update_fn = Arc::new(ArcSwapFn::empty());
let no_update_fn_clone = no_update_fn.clone();
2019-10-09 17:45:19 +08:00
let handle = thread::spawn(move || {
2019-10-16 23:05:24 +08:00
update_awaiter(receiver, env_clone, no_update_fn_clone, index_clone)
});
writer.commit()?;
entry.insert((index.clone(), no_update_fn, handle));
Ok(index)
}
}
}
pub fn set_update_callback(&self, name: impl AsRef<str>, update_fn: BoxUpdateFn) -> bool {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
Some((_, current_update_fn, _)) => {
let update_fn = Some(Arc::new(update_fn));
current_update_fn.swap(update_fn);
true
2019-10-18 19:05:28 +08:00
}
None => false,
}
}
pub fn unset_update_callback(&self, name: impl AsRef<str>) -> bool {
let indexes_lock = self.indexes.read().unwrap();
match indexes_lock.get(name.as_ref()) {
2019-10-18 19:05:28 +08:00
Some((_, current_update_fn, _)) => {
current_update_fn.swap(None);
true
}
None => false,
}
}
pub fn copy_and_compact_to_path<P: AsRef<Path>>(&self, path: P) -> ZResult<File> {
self.env.copy_to_path(path, CompactionOption::Enabled)
}
pub fn indexes_names(&self) -> MResult<Vec<String>> {
let indexes = self.indexes.read().unwrap();
Ok(indexes.keys().cloned().collect())
}
2019-10-21 18:05:53 +08:00
pub fn common_store(&self) -> heed::PolyDatabase {
2019-10-10 21:14:32 +08:00
self.common_store
}
}