From c15c076da95a87db9fb62caff4308427cdfe4824 Mon Sep 17 00:00:00 2001 From: Louis Dureuil Date: Thu, 8 Jun 2023 11:30:35 +0200 Subject: [PATCH] DB BREAKING: Count the number of words in field_id_word_count_docids --- .../extract/extract_fid_word_count_docids.rs | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/milli/src/update/index_documents/extract/extract_fid_word_count_docids.rs b/milli/src/update/index_documents/extract/extract_fid_word_count_docids.rs index 315ebdf0c..6952eb484 100644 --- a/milli/src/update/index_documents/extract/extract_fid_word_count_docids.rs +++ b/milli/src/update/index_documents/extract/extract_fid_word_count_docids.rs @@ -1,6 +1,6 @@ use std::collections::HashMap; use std::fs::File; -use std::{cmp, io}; +use std::io; use grenad::Sorter; @@ -54,11 +54,10 @@ pub fn extract_fid_word_count_docids( } for position in read_u32_ne_bytes(value) { - let (field_id, position) = relative_from_absolute_position(position); - let word_count = position as u32 + 1; + let (field_id, _) = relative_from_absolute_position(position); let value = document_fid_wordcount.entry(field_id as FieldId).or_insert(0); - *value = cmp::max(*value, word_count); + *value += 1; } }