meilisearch/milli/src/documents/builder.rs

use std::collections::BTreeMap;
use std::io;
use std::io::Cursor;
use std::io::Write;

use byteorder::{BigEndian, WriteBytesExt};
use serde::Deserializer;
use serde_json::Value;

use crate::FieldId;

use super::serde::DocumentVisitor;
use super::{ByteCounter, DocumentsBatchIndex, DocumentsMetadata, Error};

/// The `DocumentBatchBuilder` provides a way to build a documents batch in the intermediary
/// format used by milli.
///
/// The writer used by the `DocumentBatchBuilder` can be read using a `DocumentBatchReader` to
/// iterate over the documents.
pub struct DocumentBatchBuilder<W> {
    /// Destination writer wrapped in a `ByteCounter`; the byte count is what `finish` records
    /// as the metadata offset.
    inner: ByteCounter<W>,
    /// Index of the fields seen so far; it hands out the field ids used as obkv keys and is
    /// serialized as part of the metadata by `finish`.
    index: DocumentsBatchIndex,
    /// Scratch buffer receiving the obkv encoding of the document currently being written.
    obkv_buffer: Vec<u8>,
    /// Scratch buffer receiving the json serialization of a single field value.
    value_buffer: Vec<u8>,
    /// Scratch map lent to the `DocumentVisitor` while deserializing json documents.
    values: BTreeMap<FieldId, Value>,
    /// Number of documents written so far.
    count: usize,
}

impl<W: io::Write + io::Seek> DocumentBatchBuilder<W> {
    /// Creates a builder that writes the documents batch into `writer`.
    ///
    /// Eight zero bytes are written immediately: they reserve the room in which `finish`
    /// later stores the offset of the metadata.
    ///
    /// # Errors
    ///
    /// Fails if the placeholder bytes cannot be written to `writer`.
    pub fn new(writer: W) -> Result<Self, Error> {
        let mut inner = ByteCounter::new(writer);
        // Placeholder for the metadata offset, overwritten once the batch is finished.
        inner.write_u64::<BigEndian>(0)?;

        Ok(Self {
            inner,
            index: DocumentsBatchIndex::default(),
            obkv_buffer: Vec::new(),
            value_buffer: Vec::new(),
            values: BTreeMap::new(),
            count: 0,
        })
    }

    /// Returns the number of documents that have been written to the builder so far.
    ///
    /// This is the same count that `finish` stores in the batch metadata.
    pub fn len(&self) -> usize {
        self.count
    }

    /// Finalizes the batch; this must be called once every document has been added.
    ///
    /// The metadata (document count and fields index) is appended after the last document,
    /// then the offset at which the metadata starts is written at the very beginning of the
    /// writer, and the writer is flushed.
    ///
    /// # Errors
    ///
    /// Fails if the metadata cannot be serialized, or if seeking, writing or flushing the
    /// underlying writer fails.
    pub fn finish(self) -> Result<(), Error> {
        let Self { inner, index, count, .. } = self;
        // The number of bytes counted so far is exactly where the metadata is about to start.
        let ByteCounter { mut writer, count: metadata_offset } = inner;

        bincode::serialize_into(&mut writer, &DocumentsMetadata { count, index })?;

        // Go back to the start of the writer and record where the metadata lives.
        writer.seek(io::SeekFrom::Start(0))?;
        writer.write_u64::<BigEndian>(metadata_offset as u64)?;
        writer.flush()?;

        Ok(())
    }


    /// Extends the builder with json documents from a reader.
    pub fn extend_from_json<R: io::Read>(&mut self, reader: R) -> Result<(), Error> {
        let mut de = serde_json::Deserializer::from_reader(reader);

        let mut visitor = DocumentVisitor {
            inner: &mut self.inner,
            index: &mut self.index,
            obkv_buffer: &mut self.obkv_buffer,
            value_buffer: &mut self.value_buffer,
            values: &mut self.values,
            count: &mut self.count,
        };

        de.deserialize_any(&mut visitor).map_err(Error::JsonError)?;

        Ok(())
    }

    /// Extends the builder with json documents from a reader.
    ///
    /// This method can be only called once and is mutually exclusive with extend from json. This
    /// is because the fields in a csv are always guaranteed to come in order, and permits some
    /// optimizations.
    ///
    /// From csv takes care to call finish in the end.
    pub fn from_csv<R: io::Read>(reader: R, writer: W) -> Result<Self, Error> {

        let mut this = Self::new(writer)?;
        // Ensure that this is the first and only addition made with this builder
        debug_assert!(this.index.is_empty());

        let mut records = csv::Reader::from_reader(reader);

        let headers = records
            .headers()
            .unwrap()
            .into_iter()
            .map(parse_csv_header)
            .map(|(k, t)| (this.index.insert(&k), t))
            .collect::<BTreeMap<_, _>>();

        let records = records.into_records();

        for record in records {
            match record {
                Ok(record) => {
                    let mut writer = obkv::KvWriter::new(Cursor::new(&mut this.obkv_buffer));
                    for (value, (fid, ty)) in record.into_iter().zip(headers.iter()) {
                        let value = match ty {
                            AllowedType::Number => value.parse::<f64>().map(Value::from).unwrap(),
                            AllowedType::String => Value::String(value.to_string()),
                        };

                        serde_json::to_writer(Cursor::new(&mut this.value_buffer), &value).unwrap();
                        writer.insert(*fid, &this.value_buffer)?;
                        this.value_buffer.clear();
                    }

                    this.inner.write_u32::<BigEndian>(this.obkv_buffer.len() as u32)?;
                    this.inner.write_all(&this.obkv_buffer)?;

                    this.obkv_buffer.clear();
                    this.count += 1;
                },
                Err(_) => panic!(),
            }
        }

        Ok(this)
    }
}

/// Value types that a csv column can be declared with through its header suffix.
#[derive(Debug)]
enum AllowedType {
    /// The column values are kept as json strings.
    String,
    /// The column values are parsed as floating point numbers.
    Number,
}

/// Splits a csv header into the field name and the type of its column.
///
/// Only the part after the *last* `:` is looked at. When it is `string` or `number`, the
/// suffix is stripped from the field name and the matching type is returned. Otherwise (no
/// `:` at all, or an unrecognized suffix) the whole header is kept as the field name and the
/// column defaults to `AllowedType::String`.
fn parse_csv_header(header: &str) -> (String, AllowedType) {
    if let Some((name, suffix)) = header.rsplit_once(':') {
        let declared = match suffix {
            "string" => Some(AllowedType::String),
            "number" => Some(AllowedType::Number),
            _ => None,
        };

        if let Some(ty) = declared {
            return (name.to_string(), ty);
        }
    }

    // No separator, or a suffix that is not a known type: keep the header untouched.
    (header.to_string(), AllowedType::String)
}

#[cfg(test)]
mod test {
    use std::io::Cursor;

    use crate::documents::DocumentBatchReader;

    use super::*;

    /// Adds two json objects through two separate `extend_from_json` calls and checks that both
    /// documents can be read back from the finished batch.
    #[test]
    fn add_single_documents_json() {
        let mut cursor = Cursor::new(Vec::new());
        let mut builder = DocumentBatchBuilder::new(&mut cursor).unwrap();

        // First document: two fields.
        let json = serde_json::json!({
            "id": 1,
            "field": "hello!",
        });

        builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();

        // Second document: the same two fields plus a new one.
        let json = serde_json::json!({
            "blabla": false,
            "field": "hello!",
            "id": 1,
        });

        builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();

        assert_eq!(builder.len(), 2);

        builder.finish().unwrap();

        // Rewind so that the reader starts from the beginning of the batch.
        cursor.set_position(0);

        let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();

        // The index covers the three distinct fields of the whole batch, whereas each document
        // only holds its own fields.
        let (index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(index.len(), 3);
        assert_eq!(document.iter().count(), 2);

        let (index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(index.len(), 3);
        assert_eq!(document.iter().count(), 3);

        // No document is left after the second one.
        assert!(reader.next_document_with_index().unwrap().is_none());
    }

    /// Adds a json array of two objects in a single `extend_from_json` call and checks that it
    /// yields two separate documents in the finished batch.
    #[test]
    fn add_documents_seq_json() {
        let mut cursor = Cursor::new(Vec::new());
        let mut builder = DocumentBatchBuilder::new(&mut cursor).unwrap();

        // A sequence of two documents; the second one has an additional field.
        let json = serde_json::json!([{
            "id": 1,
            "field": "hello!",
        },{
            "blabla": false,
            "field": "hello!",
            "id": 1,
        }
        ]);

        builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();

        assert_eq!(builder.len(), 2);

        builder.finish().unwrap();

        // Rewind so that the reader starts from the beginning of the batch.
        cursor.set_position(0);

        let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();

        // The index covers the three distinct fields of the whole batch, whereas each document
        // only holds its own fields.
        let (index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(index.len(), 3);
        assert_eq!(document.iter().count(), 2);

        let (index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(index.len(), 3);
        assert_eq!(document.iter().count(), 3);

        // No document is left after the second one.
        assert!(reader.next_document_with_index().unwrap().is_none());
    }

    /// Builds a batch from a csv payload with typed headers and checks that every record is
    /// read back as a document with two fields.
    #[test]
    fn add_documents_csv() {
        let mut cursor = Cursor::new(Vec::new());

        // One `number` column and one `string` column, followed by two records.
        let csv = "id:number,field:string\n1,hello!\n2,blabla";

        // `from_csv` returns an unfinished builder: `finish` still has to be called explicitly.
        let builder = DocumentBatchBuilder::from_csv(Cursor::new(csv.as_bytes()), &mut cursor).unwrap();
        builder.finish().unwrap();

        // Rewind so that the reader starts from the beginning of the batch.
        cursor.set_position(0);

        let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();

        let (index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(index.len(), 2);
        assert_eq!(document.iter().count(), 2);

        let (_index, document) = reader.next_document_with_index().unwrap().unwrap();
        assert_eq!(document.iter().count(), 2);

        // No document is left after the second record.
        assert!(reader.next_document_with_index().unwrap().is_none());
    }
}
optimize document deserialization 2021-10-21 03:26:52 +08:00			`use std::collections::BTreeMap;`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`use std::io;`
implement csv serialization 2021-10-21 17:05:16 +08:00			`use std::io::Cursor;`
			`use std::io::Write;`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00
			`use byteorder::{BigEndian, WriteBytesExt};`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`use serde::Deserializer;`
			`use serde_json::Value;`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00
optimize document deserialization 2021-10-21 03:26:52 +08:00			`use crate::FieldId;`

			`use super::serde::DocumentVisitor;`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`use super::{ByteCounter, DocumentsBatchIndex, DocumentsMetadata, Error};`

			/// The `DocumentsBatchBuilder` provides a way to build a documents batch in the intermediary
			`/// format used by milli.`
			`///`
			/// The writer used by the DocumentBatchBuilder can be read using a `DocumentBatchReader` to
			`/// iterate other the documents.`
			`pub struct DocumentBatchBuilder<W> {`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`inner: ByteCounter<W>,`
			`index: DocumentsBatchIndex,`
			`obkv_buffer: Vec<u8>,`
			`value_buffer: Vec<u8>,`
			`values: BTreeMap<FieldId, Value>,`
			`count: usize,`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`}`

			`impl<W: io::Write + io::Seek> DocumentBatchBuilder<W> {`
			`pub fn new(writer: W) -> Result<Self, Error> {`
implement csv serialization 2021-10-21 17:05:16 +08:00			`let index = DocumentsBatchIndex::default();`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`let mut writer = ByteCounter::new(writer);`
			`// add space to write the offset of the metadata at the end of the writer`
			`writer.write_u64::<BigEndian>(0)?;`

optimize document deserialization 2021-10-21 03:26:52 +08:00			`let this = Self {`
			`inner: writer,`
			`index,`
			`obkv_buffer: Vec::new(),`
			`value_buffer: Vec::new(),`
			`values: BTreeMap::new(),`
			`count: 0,`
			`};`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00
optimize document deserialization 2021-10-21 03:26:52 +08:00			`Ok(this)`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`}`

			`/// Returns the number of documents that have been written to the builder.`
			`pub fn len(&self) -> usize {`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`self.count`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`}`

			`/// This method must be called after the document addition is terminated. It will put the`
			`/// metadata at the end of the file, and write the metadata offset at the beginning on the`
			`/// file.`
			`pub fn finish(self) -> Result<(), Error> {`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`let Self {`
			`inner: ByteCounter { mut writer, count: offset },`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`index,`
			`count,`
			`..`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`} = self;`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00
			`let meta = DocumentsMetadata { count, index };`

			`bincode::serialize_into(&mut writer, &meta)?;`

			`writer.seek(io::SeekFrom::Start(0))?;`
			`writer.write_u64::<BigEndian>(offset as u64)?;`

			`writer.flush()?;`

			`Ok(())`
			`}`

optimize document deserialization 2021-10-21 03:26:52 +08:00
			`/// Extends the builder with json documents from a reader.`
			`pub fn extend_from_json<R: io::Read>(&mut self, reader: R) -> Result<(), Error> {`
			`let mut de = serde_json::Deserializer::from_reader(reader);`

			`let mut visitor = DocumentVisitor {`
			`inner: &mut self.inner,`
			`index: &mut self.index,`
			`obkv_buffer: &mut self.obkv_buffer,`
			`value_buffer: &mut self.value_buffer,`
			`values: &mut self.values,`
			`count: &mut self.count,`
			`};`

fix tests 2021-10-24 20:41:36 +08:00			`de.deserialize_any(&mut visitor).map_err(Error::JsonError)?;`
optimize document deserialization 2021-10-21 03:26:52 +08:00
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`Ok(())`
			`}`
implement csv serialization 2021-10-21 17:05:16 +08:00
			`/// Extends the builder with json documents from a reader.`
			`///`
			`/// This method can be only called once and is mutually exclusive with extend from json. This`
			`/// is because the fields in a csv are always guaranteed to come in order, and permits some`
			`/// optimizations.`
			`///`
			`/// From csv takes care to call finish in the end.`
fix tests 2021-10-24 20:41:36 +08:00			`pub fn from_csv<R: io::Read>(reader: R, writer: W) -> Result<Self, Error> {`
implement csv serialization 2021-10-21 17:05:16 +08:00
fix tests 2021-10-24 20:41:36 +08:00			`let mut this = Self::new(writer)?;`
implement csv serialization 2021-10-21 17:05:16 +08:00			`// Ensure that this is the first and only addition made with this builder`
fix tests 2021-10-24 20:41:36 +08:00			`debug_assert!(this.index.is_empty());`
implement csv serialization 2021-10-21 17:05:16 +08:00
			`let mut records = csv::Reader::from_reader(reader);`

			`let headers = records`
			`.headers()`
			`.unwrap()`
			`.into_iter()`
			`.map(parse_csv_header)`
fix tests 2021-10-24 20:41:36 +08:00			`.map(\|(k, t)\| (this.index.insert(&k), t))`
			`.collect::<BTreeMap<_, _>>();`
implement csv serialization 2021-10-21 17:05:16 +08:00
			`let records = records.into_records();`

			`for record in records {`
			`match record {`
			`Ok(record) => {`
fix tests 2021-10-24 20:41:36 +08:00			`let mut writer = obkv::KvWriter::new(Cursor::new(&mut this.obkv_buffer));`
implement csv serialization 2021-10-21 17:05:16 +08:00			`for (value, (fid, ty)) in record.into_iter().zip(headers.iter()) {`
			`let value = match ty {`
			`AllowedType::Number => value.parse::<f64>().map(Value::from).unwrap(),`
			`AllowedType::String => Value::String(value.to_string()),`
			`};`

fix tests 2021-10-24 20:41:36 +08:00			`serde_json::to_writer(Cursor::new(&mut this.value_buffer), &value).unwrap();`
			`writer.insert(*fid, &this.value_buffer)?;`
			`this.value_buffer.clear();`
implement csv serialization 2021-10-21 17:05:16 +08:00			`}`

fix tests 2021-10-24 20:41:36 +08:00			`this.inner.write_u32::<BigEndian>(this.obkv_buffer.len() as u32)?;`
			`this.inner.write_all(&this.obkv_buffer)?;`
implement csv serialization 2021-10-21 17:05:16 +08:00
fix tests 2021-10-24 20:41:36 +08:00			`this.obkv_buffer.clear();`
			`this.count += 1;`
implement csv serialization 2021-10-21 17:05:16 +08:00			`},`
			`Err(_) => panic!(),`
			`}`
			`}`

fix tests 2021-10-24 20:41:36 +08:00			`Ok(this)`
implement csv serialization 2021-10-21 17:05:16 +08:00			`}`
			`}`

			`#[derive(Debug)]`
			`enum AllowedType {`
			`String,`
			`Number,`
			`}`

			`fn parse_csv_header(header: &str) -> (String, AllowedType) {`
			`// if there are several separators we only split on the last one.`
			`match header.rsplit_once(':') {`
			`Some((field_name, field_type)) => match field_type {`
			`"string" => (field_name.to_string(), AllowedType::String),`
			`"number" => (field_name.to_string(), AllowedType::Number), // if the pattern isn't reconized, we keep the whole field.`
			`_otherwise => (header.to_string(), AllowedType::String),`
			`},`
			`None => (header.to_string(), AllowedType::String),`
			`}`
Implement documents format document reader transform remove update format support document sequences fix document transform clean transform improve error handling add documents! macro fix transform bug fix tests remove csv dependency Add comments on the transform process replace search cli fmt review edits fix http ui fix clippy warnings Revert "fix clippy warnings" This reverts commit a1ce3cd96e603633dbf43e9e0b12b2453c9c5620. fix review comments remove smallvec in transform loop review edits 2021-08-31 17:44:15 +08:00			`}`
optimize document deserialization 2021-10-21 03:26:52 +08:00
			`#[cfg(test)]`
			`mod test {`
			`use std::io::Cursor;`

			`use crate::documents::DocumentBatchReader;`

			`use super::*;`

			`#[test]`
			`fn add_single_documents_json() {`
			`let mut cursor = Cursor::new(Vec::new());`
			`let mut builder = DocumentBatchBuilder::new(&mut cursor).unwrap();`

			`let json = serde_json::json!({`
			`"id": 1,`
			`"field": "hello!",`
			`});`

			`builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();`

			`let json = serde_json::json!({`
			`"blabla": false,`
			`"field": "hello!",`
			`"id": 1,`
			`});`

			`builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();`

			`assert_eq!(builder.len(), 2);`

			`builder.finish().unwrap();`

			`cursor.set_position(0);`

			`let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();`

			`let (index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(index.len(), 3);`
			`assert_eq!(document.iter().count(), 2);`

			`let (index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(index.len(), 3);`
			`assert_eq!(document.iter().count(), 3);`

			`assert!(reader.next_document_with_index().unwrap().is_none());`
			`}`

			`#[test]`
			`fn add_documents_seq_json() {`
			`let mut cursor = Cursor::new(Vec::new());`
			`let mut builder = DocumentBatchBuilder::new(&mut cursor).unwrap();`

			`let json = serde_json::json!([{`
			`"id": 1,`
			`"field": "hello!",`
			`},{`
			`"blabla": false,`
			`"field": "hello!",`
			`"id": 1,`
			`}`
			`]);`

			`builder.extend_from_json(Cursor::new(serde_json::to_vec(&json).unwrap())).unwrap();`

			`assert_eq!(builder.len(), 2);`

			`builder.finish().unwrap();`

			`cursor.set_position(0);`

			`let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();`

			`let (index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(index.len(), 3);`
			`assert_eq!(document.iter().count(), 2);`

			`let (index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(index.len(), 3);`
			`assert_eq!(document.iter().count(), 3);`

			`assert!(reader.next_document_with_index().unwrap().is_none());`
			`}`
implement csv serialization 2021-10-21 17:05:16 +08:00
			`#[test]`
			`fn add_documents_csv() {`
			`let mut cursor = Cursor::new(Vec::new());`

			`let csv = "id:number,field:string\n1,hello!\n2,blabla";`

fix tests 2021-10-24 20:41:36 +08:00			`let builder = DocumentBatchBuilder::from_csv(Cursor::new(csv.as_bytes()), &mut cursor).unwrap();`
			`builder.finish().unwrap();`
implement csv serialization 2021-10-21 17:05:16 +08:00
			`cursor.set_position(0);`

			`let mut reader = DocumentBatchReader::from_reader(cursor).unwrap();`

			`let (index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(index.len(), 2);`
			`assert_eq!(document.iter().count(), 2);`

			`let (_index, document) = reader.next_document_with_index().unwrap().unwrap();`
			`assert_eq!(document.iter().count(), 2);`

			`assert!(reader.next_document_with_index().unwrap().is_none());`
			`}`
optimize document deserialization 2021-10-21 03:26:52 +08:00			`}`