2021-08-23 18:41:48 +02:00
|
|
|
use std::fs::File;
|
|
|
|
use std::io;
|
|
|
|
|
|
|
|
use concat_arrays::concat_arrays;
|
|
|
|
|
|
|
|
use super::helpers::{create_writer, writer_into_reader, GrenadParameters};
|
2021-09-02 15:57:40 +02:00
|
|
|
use crate::{FieldId, InternalError, Result, UserError};
|
2021-08-23 18:41:48 +02:00
|
|
|
|
|
|
|
/// Extracts the geographical coordinates contained in each document under the `_geo` field.
|
|
|
|
///
|
|
|
|
/// Returns the generated grenad reader containing the docid as key associated to the (latitude, longitude)
|
2022-02-16 15:28:48 +01:00
|
|
|
pub fn extract_geo_points<R: io::Read + io::Seek>(
|
|
|
|
obkv_documents: grenad::Reader<R>,
|
2021-08-23 18:41:48 +02:00
|
|
|
indexer: GrenadParameters,
|
2021-09-02 15:57:40 +02:00
|
|
|
primary_key_id: FieldId,
|
2022-03-23 17:28:41 +01:00
|
|
|
(lat_fid, lng_fid): (FieldId, FieldId),
|
2021-08-23 18:41:48 +02:00
|
|
|
) -> Result<grenad::Reader<File>> {
|
2022-02-16 15:28:48 +01:00
|
|
|
let mut writer = create_writer(
|
|
|
|
indexer.chunk_compression_type,
|
|
|
|
indexer.chunk_compression_level,
|
|
|
|
tempfile::tempfile()?,
|
|
|
|
);
|
2021-08-23 18:41:48 +02:00
|
|
|
|
2022-02-16 15:28:48 +01:00
|
|
|
let mut cursor = obkv_documents.into_cursor()?;
|
|
|
|
while let Some((docid_bytes, value)) = cursor.move_on_next()? {
|
2021-08-23 18:41:48 +02:00
|
|
|
let obkv = obkv::KvReader::new(value);
|
2022-03-23 17:28:41 +01:00
|
|
|
let (lat, lng) = obkv.get(lat_fid).zip(obkv.get(lng_fid)).ok_or_else(|| {
|
2021-09-08 18:12:10 +02:00
|
|
|
let primary_key = obkv.get(primary_key_id).unwrap();
|
2022-03-23 17:28:41 +01:00
|
|
|
let primary_key = serde_json::from_slice(primary_key).unwrap();
|
|
|
|
UserError::InvalidGeoField { document_id: primary_key }
|
|
|
|
})?;
|
|
|
|
let (lat, lng): (f64, f64) = (
|
|
|
|
serde_json::from_slice(lat).map_err(InternalError::SerdeJson)?,
|
|
|
|
serde_json::from_slice(lng).map_err(InternalError::SerdeJson)?,
|
|
|
|
);
|
|
|
|
|
|
|
|
let bytes: [u8; 16] = concat_arrays![lat.to_ne_bytes(), lng.to_ne_bytes()];
|
|
|
|
writer.insert(docid_bytes, bytes)?;
|
2021-08-23 18:41:48 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
Ok(writer_into_reader(writer)?)
|
|
|
|
}
|