2024-09-02 10:42:19 +02:00
|
|
|
use std::sync::Arc;
|
|
|
|
|
|
|
|
use rayon::iter::{ParallelBridge, ParallelIterator};
|
|
|
|
use roaring::RoaringBitmap;
|
|
|
|
|
|
|
|
use super::Indexer;
|
|
|
|
use crate::documents::PrimaryKey;
|
|
|
|
use crate::update::new::{Deletion, DocumentChange, ItemsPool};
|
|
|
|
use crate::{FieldsIdsMap, Index, InternalError, Result};
|
|
|
|
|
2024-09-02 14:42:27 +02:00
|
|
|
pub struct DocumentDeletion {
|
2024-09-02 10:42:19 +02:00
|
|
|
pub to_delete: RoaringBitmap,
|
|
|
|
}
|
|
|
|
|
2024-09-02 14:42:27 +02:00
|
|
|
impl DocumentDeletion {
|
2024-09-02 10:42:19 +02:00
|
|
|
pub fn new() -> Self {
|
|
|
|
Self { to_delete: Default::default() }
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn delete_documents_by_docids(&mut self, docids: RoaringBitmap) {
|
|
|
|
self.to_delete |= docids;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-09-02 14:42:27 +02:00
|
|
|
impl<'p> Indexer<'p> for DocumentDeletion {
|
2024-09-02 10:42:19 +02:00
|
|
|
type Parameter = (&'p Index, &'p FieldsIdsMap, &'p PrimaryKey<'p>);
|
|
|
|
|
|
|
|
fn document_changes(
|
|
|
|
self,
|
|
|
|
param: Self::Parameter,
|
|
|
|
) -> Result<impl ParallelIterator<Item = Result<Option<DocumentChange>>> + 'p> {
|
|
|
|
let (index, fields, primary_key) = param;
|
|
|
|
let items = Arc::new(ItemsPool::new(|| index.read_txn().map_err(crate::Error::from)));
|
|
|
|
Ok(self.to_delete.into_iter().par_bridge().map_with(items, |items, docid| {
|
|
|
|
items.with(|rtxn| {
|
|
|
|
let current = index.document(rtxn, docid)?;
|
|
|
|
let external_docid = match primary_key.document_id(current, fields)? {
|
|
|
|
Ok(document_id) => Ok(document_id) as Result<_>,
|
|
|
|
Err(_) => Err(InternalError::DocumentsError(
|
|
|
|
crate::documents::Error::InvalidDocumentFormat,
|
|
|
|
)
|
|
|
|
.into()),
|
|
|
|
}?;
|
|
|
|
|
|
|
|
Ok(Some(DocumentChange::Deletion(Deletion::create(
|
|
|
|
docid,
|
|
|
|
external_docid,
|
|
|
|
current.boxed(),
|
|
|
|
))))
|
|
|
|
})
|
|
|
|
}))
|
|
|
|
}
|
|
|
|
}
|