meilisearch/milli/src/search/new/mod.rs

mod db_cache;
mod distinct;
mod graph_based_ranking_rule;
mod interner;
mod logger;
mod query_graph;
mod query_term;
mod ranking_rule_graph;
mod ranking_rules;
mod resolve_query_graph;
// TODO: documentation + comments
mod small_bitmap;
// TODO: documentation + comments
mod sort;
// TODO: documentation + comments
mod words;

// #[cfg(test)]
use std::collections::{BTreeSet, HashSet};

use charabia::Tokenize;
use db_cache::DatabaseCache;
use graph_based_ranking_rule::{Proximity, Typo};
use heed::RoTxn;
use interner::DedupInterner;
pub use logger::detailed::DetailedSearchLogger;
pub use logger::{DefaultSearchLogger, SearchLogger};
use query_graph::{QueryGraph, QueryNode, QueryNodeData};
use query_term::{located_query_terms_from_string, Phrase, QueryTerm};
use ranking_rules::{bucket_sort, PlaceholderQuery, RankingRuleOutput, RankingRuleQueryTrait};
use resolve_query_graph::{resolve_query_graph, QueryTermDocIdsCache};
use roaring::RoaringBitmap;
use words::Words;

use self::ranking_rules::RankingRule;
use crate::{Filter, Index, MatchingWords, Result, Search, SearchResult, TermsMatchingStrategy};

/// A structure used throughout the execution of a search query.
///
/// It groups the index and transaction being searched with the caches and
/// interners that the search functions in this module receive through `ctx`.
pub struct SearchContext<'ctx> {
    /// The index the search is executed against.
    pub index: &'ctx Index,
    /// The read transaction used to read from `index`.
    pub txn: &'ctx RoTxn<'ctx>,
    /// Database cache defined in the `db_cache` module.
    // NOTE(review): presumably memoises reads made through `txn` — confirm in `db_cache`.
    pub db_cache: DatabaseCache<'ctx>,
    /// Interner for words, stored as `String`s.
    pub word_interner: DedupInterner<String>,
    /// Interner for [`Phrase`]s.
    pub phrase_interner: DedupInterner<Phrase>,
    /// Interner for [`QueryTerm`]s.
    pub term_interner: DedupInterner<QueryTerm>,
    /// Cache defined in the `resolve_query_graph` module.
    // NOTE(review): presumably holds the document ids already computed for query
    // terms — confirm in `resolve_query_graph`.
    pub term_docids: QueryTermDocIdsCache,
}
impl<'ctx> SearchContext<'ctx> {
    /// Create a context for searching `index` through the read transaction `txn`.
    ///
    /// The cache and every interner start out with their `Default` value.
    pub fn new(index: &'ctx Index, txn: &'ctx RoTxn<'ctx>) -> Self {
        Self {
            index,
            txn,
            db_cache: Default::default(),
            word_interner: Default::default(),
            phrase_interner: Default::default(),
            term_interner: Default::default(),
            term_docids: Default::default(),
        }
    }
}

/// Apply the [`TermsMatchingStrategy`] to the query graph and resolve it.
///
/// The function works on a clone of `query_graph`; the caller's graph is left untouched.
///
/// - With [`TermsMatchingStrategy::Last`], the positions of all term nodes are gathered
///   and the words starting at each of them are removed from the clone, except for the
///   smallest position, which is always kept.
/// - With [`TermsMatchingStrategy::All`], nothing is removed.
///
/// The reduced graph is then reported to `logger` and resolved against `universe`.
///
/// # Errors
///
/// Returns any error produced by `resolve_query_graph`.
fn resolve_maximally_reduced_query_graph<'ctx>(
    ctx: &mut SearchContext<'ctx>,
    universe: &RoaringBitmap,
    query_graph: &QueryGraph,
    matching_strategy: TermsMatchingStrategy,
    logger: &mut dyn SearchLogger<QueryGraph>,
) -> Result<RoaringBitmap> {
    let mut graph = query_graph.clone();

    let positions_to_remove: Vec<_> = match matching_strategy {
        TermsMatchingStrategy::Last => {
            // A `BTreeSet` deduplicates the positions and yields them in ascending order.
            let mut all_positions = BTreeSet::new();
            for (_, node) in query_graph.nodes.iter() {
                match &node.data {
                    QueryNodeData::Term(term) => all_positions.extend(term.positions.clone()),
                    QueryNodeData::Deleted | QueryNodeData::Start | QueryNodeData::End => {}
                }
            }
            // Don't remove the first term: skip the smallest position.
            all_positions.into_iter().skip(1).collect()
        }
        TermsMatchingStrategy::All => vec![],
    };

    // Remove from the largest position down to the smallest remaining one.
    for position in positions_to_remove.into_iter().rev() {
        let _ = graph.remove_words_starting_at_position(position);
    }

    logger.query_for_universe(&graph);
    resolve_query_graph(ctx, &graph, universe)
}

/// Return the list of initialised ranking rules to be used for a placeholder search.
///
/// The criteria configured on the index are read through `ctx`. None of them is
/// turned into a ranking rule yet, so the returned list is currently always empty.
///
/// # Errors
///
/// Returns an error if the criteria cannot be read from the index.
fn get_ranking_rules_for_placeholder_search<'ctx>(
    ctx: &SearchContext<'ctx>,
) -> Result<Vec<Box<dyn RankingRule<'ctx, PlaceholderQuery>>>> {
    let ranking_rules: Vec<Box<dyn RankingRule<PlaceholderQuery>>> = vec![];
    let settings_ranking_rules = ctx.index.criteria(ctx.txn)?;
    for rr in settings_ranking_rules {
        match rr {
            // These criteria are skipped for a placeholder search.
            crate::Criterion::Words
            | crate::Criterion::Typo
            | crate::Criterion::Attribute
            | crate::Criterion::Proximity
            | crate::Criterion::Exactness => continue,
            // TODO: implement sort / asc / desc for placeholder searches.
            // Until then they are ignored, as in the query graph search, instead of
            // panicking on every index whose criteria contain one of them.
            crate::Criterion::Sort | crate::Criterion::Asc(_) | crate::Criterion::Desc(_) => {
                continue
            }
        }
    }
    Ok(ranking_rules)
}

/// Build the ordered list of ranking rules used for a query graph search.
///
/// The criteria configured on the index are visited in order:
///
/// - `Words`, `Typo` and `Proximity` each contribute at most one ranking rule.
/// - A `Words` rule is inserted before the first of `Typo`, `Attribute`,
///   `Proximity` or `Exactness` if none has been added yet.
/// - `Attribute`, `Sort`, `Exactness`, `Asc` and `Desc` do not produce a rule yet.
///
/// # Errors
///
/// Returns an error if the criteria cannot be read from the index.
fn get_ranking_rules_for_query_graph_search<'ctx>(
    ctx: &SearchContext<'ctx>,
    terms_matching_strategy: TermsMatchingStrategy,
) -> Result<Vec<Box<dyn RankingRule<'ctx, QueryGraph>>>> {
    let mut has_words = false;
    let mut has_typo = false;
    let mut has_proximity = false;
    let mut seen_asc = HashSet::new();
    let mut seen_desc = HashSet::new();

    let mut rules: Vec<Box<dyn RankingRule<QueryGraph>>> = Vec::new();
    for criterion in ctx.index.criteria(ctx.txn)? {
        // Add Words before any of: typo, proximity, attribute, exactness
        // TODO: no exactness
        let requires_words = matches!(
            criterion,
            crate::Criterion::Typo
                | crate::Criterion::Attribute
                | crate::Criterion::Proximity
                | crate::Criterion::Exactness
        );
        if requires_words && !has_words {
            rules.push(Box::new(Words::new(terms_matching_strategy)));
            has_words = true;
        }

        match criterion {
            crate::Criterion::Words => {
                if !has_words {
                    rules.push(Box::new(Words::new(terms_matching_strategy)));
                    has_words = true;
                }
            }
            crate::Criterion::Typo => {
                if !has_typo {
                    has_typo = true;
                    rules.push(Box::<Typo>::default());
                }
            }
            crate::Criterion::Proximity => {
                if !has_proximity {
                    has_proximity = true;
                    rules.push(Box::<Proximity>::default());
                }
            }
            // TODO: attribute, sort and exactness have no ranking rule yet.
            crate::Criterion::Attribute
            | crate::Criterion::Sort
            | crate::Criterion::Exactness => {}
            crate::Criterion::Asc(field) => {
                // Only remembers the field for now. TODO: add the ranking rule.
                seen_asc.insert(field);
            }
            crate::Criterion::Desc(field) => {
                // Only remembers the field for now. TODO: add the ranking rule.
                seen_desc.insert(field);
            }
        }
    }
    Ok(rules)
}

/// Execute a search for `query` and return its [`SearchResult`].
///
/// Steps:
/// 1. The query is tokenized and turned into a [`QueryGraph`].
/// 2. The initial universe is the result of `filters` when given, otherwise all the
///    document ids of the index.
/// 3. If the graph has more than two nodes, the universe is narrowed by resolving the
///    graph reduced according to `terms_matching_strategy`, and the documents are
///    sorted with the query graph ranking rules. Otherwise the search is handled as a
///    placeholder search.
///
/// `from` and `length` are forwarded to `bucket_sort`.
/// NOTE(review): presumably the offset and the maximum number of documents — confirm.
///
/// The result's `documents_ids` is the output of `bucket_sort`, `candidates` is the
/// final universe, and `matching_words` is left at its default value for now.
///
/// # Panics
///
/// Panics if `query` is empty.
///
/// # Errors
///
/// Propagates any error raised while building the query graph, evaluating the
/// filters, reading the index, or sorting the documents.
// Every argument is an independent input of the search, hence the lint exemption.
#[allow(clippy::too_many_arguments)]
pub fn execute_search<'ctx>(
    ctx: &mut SearchContext<'ctx>,
    query: &str,
    terms_matching_strategy: TermsMatchingStrategy,
    filters: Option<Filter>,
    from: usize,
    length: usize,
    placeholder_search_logger: &mut dyn SearchLogger<PlaceholderQuery>,
    query_graph_logger: &mut dyn SearchLogger<QueryGraph>,
) -> Result<SearchResult> {
    assert!(!query.is_empty());
    let located_terms = located_query_terms_from_string(ctx, query.tokenize(), None)?;
    let query_graph = QueryGraph::from_query(ctx, located_terms)?;

    let mut universe = match filters {
        Some(filters) => filters.evaluate(ctx.txn, ctx.index)?,
        None => ctx.index.documents_ids(ctx.txn)?,
    };

    // TODO: other way to tell whether it is a placeholder search
    // This way of doing things is not correct because if someone searches
    // for a word that does not appear in any document, the word will be removed
    // from the graph and thus its number of nodes will be == 2
    // But in that case, we should return no results.
    //
    // The search is a placeholder search only if there are no tokens?
    let is_placeholder_search = query_graph.nodes.len() <= 2;

    let documents_ids = if is_placeholder_search {
        let rules = get_ranking_rules_for_placeholder_search(ctx)?;
        bucket_sort(
            ctx,
            rules,
            &PlaceholderQuery,
            &universe,
            from,
            length,
            placeholder_search_logger,
        )?
    } else {
        universe = resolve_maximally_reduced_query_graph(
            ctx,
            &universe,
            &query_graph,
            terms_matching_strategy,
            query_graph_logger,
        )?;

        let rules = get_ranking_rules_for_query_graph_search(ctx, terms_matching_strategy)?;
        bucket_sort(ctx, rules, &query_graph, &universe, from, length, query_graph_logger)?
    };

    // TODO: correct matching words
    let matching_words = MatchingWords::default();
    // TODO: candidates with distinct
    let candidates = universe;

    Ok(SearchResult { matching_words, candidates, documents_ids })
}

impl<'a> Search<'a> {
    /// Placeholder for executing this [`Search`] and returning its [`SearchResult`].
    ///
    /// NOTE(review): presumably meant to delegate to `execute_search` once wired up —
    /// confirm with the author.
    ///
    /// # Panics
    ///
    /// Always panics for now: the body is a `todo!()`.
    // TODO: implement
    pub fn execute_new(&self) -> Result<SearchResult> {
        todo!()
    }
}
Fix code visibility issue + unimplemented detail in proximity rule 2023-03-06 03:07:37 +08:00			`mod db_cache;`
Implement distinct attribute 2023-03-09 22:20:29 +08:00			`mod distinct;`
Fix code visibility issue + unimplemented detail in proximity rule 2023-03-06 03:07:37 +08:00			`mod graph_based_ranking_rule;`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`mod interner;`
Fix code visibility issue + unimplemented detail in proximity rule 2023-03-06 03:07:37 +08:00			`mod logger;`
			`mod query_graph;`
			`mod query_term;`
			`mod ranking_rule_graph;`
			`mod ranking_rules;`
			`mod resolve_query_graph;`
Intern more values 2023-03-09 18:12:31 +08:00			`// TODO: documentation + comments`
Apply a few optimisations for graph-based ranking rules 2023-03-07 21:42:58 +08:00			`mod small_bitmap;`
Intern more values 2023-03-09 18:12:31 +08:00			`// TODO: documentation + comments`
Fix code visibility issue + unimplemented detail in proximity rule 2023-03-06 03:07:37 +08:00			`mod sort;`
Intern more values 2023-03-09 18:12:31 +08:00			`// TODO: documentation + comments`
Fix code visibility issue + unimplemented detail in proximity rule 2023-03-06 03:07:37 +08:00			`mod words;`
Introduce a new search module, eventually meant to replace the old one The code here does not compile, because I am merely splitting one giant commit into smaller ones where each commit explains a single file. 2023-02-21 16:41:58 +08:00
WIP 2023-03-18 22:04:34 +08:00			`// #[cfg(test)]`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`use std::collections::{BTreeSet, HashSet};`
Cargo fmt 2023-03-08 16:55:53 +08:00
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`use charabia::Tokenize;`
			`use db_cache::DatabaseCache;`
WIP 2023-03-18 22:04:34 +08:00			`use graph_based_ranking_rule::{Proximity, Typo};`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`use heed::RoTxn;`
WIP 2023-03-18 22:04:34 +08:00			`use interner::DedupInterner;`
Cargo fmt 2023-03-19 22:15:58 +08:00			`pub use logger::detailed::DetailedSearchLogger;`
			`pub use logger::{DefaultSearchLogger, SearchLogger};`
WIP 2023-03-18 22:04:34 +08:00			`use query_graph::{QueryGraph, QueryNode, QueryNodeData};`
			`use query_term::{located_query_terms_from_string, Phrase, QueryTerm};`
			`use ranking_rules::{bucket_sort, PlaceholderQuery, RankingRuleOutput, RankingRuleQueryTrait};`
			`use resolve_query_graph::{resolve_query_graph, QueryTermDocIdsCache};`
Apply a few optimisations for graph-based ranking rules 2023-03-07 21:42:58 +08:00			`use roaring::RoaringBitmap;`
WIP 2023-03-18 22:04:34 +08:00			`use words::Words;`
Cargo fmt 2023-03-08 16:55:53 +08:00
WIP 2023-03-18 22:04:34 +08:00			`use self::ranking_rules::RankingRule;`
Cargo fmt 2023-03-19 22:15:58 +08:00			`use crate::{Filter, Index, MatchingWords, Result, Search, SearchResult, TermsMatchingStrategy};`
Introduce a new search module, eventually meant to replace the old one The code here does not compile, because I am merely splitting one giant commit into smaller ones where each commit explains a single file. 2023-02-21 16:41:58 +08:00
Replace EdgeCondition with an Option<..> + other code cleanup 2023-03-16 18:52:51 +08:00			`/// A structure used throughout the execution of a search query.`
Rename lifetime 2023-03-13 21:03:48 +08:00			`pub struct SearchContext<'ctx> {`
			`pub index: &'ctx Index,`
			`pub txn: &'ctx RoTxn<'ctx>,`
			`pub db_cache: DatabaseCache<'ctx>,`
Refactor of the Interner 2023-03-14 23:37:47 +08:00			`pub word_interner: DedupInterner<String>,`
			`pub phrase_interner: DedupInterner<Phrase>,`
			`pub term_interner: DedupInterner<QueryTerm>,`
Merge Phrase and WordDerivations into one structure 2023-03-14 17:54:55 +08:00			`pub term_docids: QueryTermDocIdsCache,`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`}`
Rename lifetime 2023-03-13 21:03:48 +08:00			`impl<'ctx> SearchContext<'ctx> {`
			`pub fn new(index: &'ctx Index, txn: &'ctx RoTxn<'ctx>) -> Self {`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`Self {`
			`index,`
			`txn,`
			`db_cache: <_>::default(),`
			`word_interner: <_>::default(),`
			`phrase_interner: <_>::default(),`
Merge Phrase and WordDerivations into one structure 2023-03-14 17:54:55 +08:00			`term_interner: <_>::default(),`
			`term_docids: <_>::default(),`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`}`
			`}`
			`}`

Replace EdgeCondition with an Option<..> + other code cleanup 2023-03-16 18:52:51 +08:00			/// Apply the [`TermsMatchingStrategy`] to the query graph and resolve it.
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`#[allow(clippy::too_many_arguments)]`
Rename lifetime 2023-03-13 21:03:48 +08:00			`fn resolve_maximally_reduced_query_graph<'ctx>(`
			`ctx: &mut SearchContext<'ctx>,`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`universe: &RoaringBitmap,`
			`query_graph: &QueryGraph,`
			`matching_strategy: TermsMatchingStrategy,`
			`logger: &mut dyn SearchLogger<QueryGraph>,`
			`) -> Result<RoaringBitmap> {`
			`let mut graph = query_graph.clone();`
			`let mut positions_to_remove = match matching_strategy {`
			`TermsMatchingStrategy::Last => {`
			`let mut all_positions = BTreeSet::new();`
Refactor of the Interner 2023-03-14 23:37:47 +08:00			`for (_, n) in query_graph.nodes.iter() {`
			`match &n.data {`
			`QueryNodeData::Term(term) => {`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`all_positions.extend(term.positions.clone().into_iter());`
			`}`
Refactor of the Interner 2023-03-14 23:37:47 +08:00			`QueryNodeData::Deleted \| QueryNodeData::Start \| QueryNodeData::End => {}`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`}`
			`}`
			`all_positions.into_iter().collect()`
			`}`
			`TermsMatchingStrategy::All => vec![],`
			`};`
			`// don't remove the first term`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`if !positions_to_remove.is_empty() {`
			`positions_to_remove.remove(0);`
			`}`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`loop {`
			`if positions_to_remove.is_empty() {`
			`break;`
			`} else {`
			`let position_to_remove = positions_to_remove.pop().unwrap();`
Add documentation 2023-03-08 20:26:29 +08:00			`let _ = graph.remove_words_starting_at_position(position_to_remove);`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`}`
			`}`
			`logger.query_for_universe(&graph);`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`let docids = resolve_query_graph(ctx, &graph, universe)?;`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00
			`Ok(docids)`
			`}`
Replace EdgeCondition with an Option<..> + other code cleanup 2023-03-16 18:52:51 +08:00
			`/// Return the list of initialised ranking rules to be used for a placeholder search.`
Rename lifetime 2023-03-13 21:03:48 +08:00			`fn get_ranking_rules_for_placeholder_search<'ctx>(`
			`ctx: &SearchContext<'ctx>,`
			`) -> Result<Vec<Box<dyn RankingRule<'ctx, PlaceholderQuery>>>> {`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// let sort = false;`
			`// let mut asc = HashSet::new();`
			`// let mut desc = HashSet::new();`
			`let /mut/ ranking_rules: Vec<Box<dyn RankingRule<PlaceholderQuery>>> = vec![];`
			`let settings_ranking_rules = ctx.index.criteria(ctx.txn)?;`
			`for rr in settings_ranking_rules {`
			`// Add Words before any of: typo, proximity, attribute, exactness`
			`match rr {`
			`crate::Criterion::Words`
			`\| crate::Criterion::Typo`
			`\| crate::Criterion::Attribute`
			`\| crate::Criterion::Proximity`
			`\| crate::Criterion::Exactness => continue,`
			`crate::Criterion::Sort => todo!(),`
			`crate::Criterion::Asc(_) => todo!(),`
			`crate::Criterion::Desc(_) => todo!(),`
			`}`
			`}`
			`Ok(ranking_rules)`
			`}`
Replace EdgeCondition with an Option<..> + other code cleanup 2023-03-16 18:52:51 +08:00
			`/// Return the list of initialised ranking rules to be used for a query graph search.`
Rename lifetime 2023-03-13 21:03:48 +08:00			`fn get_ranking_rules_for_query_graph_search<'ctx>(`
			`ctx: &SearchContext<'ctx>,`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`terms_matching_strategy: TermsMatchingStrategy,`
Rename lifetime 2023-03-13 21:03:48 +08:00			`) -> Result<Vec<Box<dyn RankingRule<'ctx, QueryGraph>>>> {`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// query graph search`
			`let mut words = false;`
			`let mut typo = false;`
			`let mut proximity = false;`
			`let sort = false;`
			`let attribute = false;`
			`let exactness = false;`
			`let mut asc = HashSet::new();`
			`let mut desc = HashSet::new();`

			`let mut ranking_rules: Vec<Box<dyn RankingRule<QueryGraph>>> = vec![];`
			`let settings_ranking_rules = ctx.index.criteria(ctx.txn)?;`
			`for rr in settings_ranking_rules {`
			`// Add Words before any of: typo, proximity, attribute, exactness`
			`match rr {`
			`crate::Criterion::Typo`
			`\| crate::Criterion::Attribute`
			`\| crate::Criterion::Proximity`
WIP 2023-03-22 21:43:08 +08:00			`// TODO: no exactness`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`\| crate::Criterion::Exactness => {`
			`if !words {`
			`ranking_rules.push(Box::new(Words::new(terms_matching_strategy)));`
			`words = true;`
			`}`
			`}`
			`_ => {}`
			`}`
			`match rr {`
			`crate::Criterion::Words => {`
			`if words {`
			`continue;`
			`}`
			`ranking_rules.push(Box::new(Words::new(terms_matching_strategy)));`
			`words = true;`
			`}`
			`crate::Criterion::Typo => {`
			`if typo {`
			`continue;`
			`}`
			`typo = true;`
			`ranking_rules.push(Box::<Typo>::default());`
			`}`
			`crate::Criterion::Proximity => {`
			`if proximity {`
			`continue;`
			`}`
			`proximity = true;`
			`ranking_rules.push(Box::<Proximity>::default());`
			`}`
			`crate::Criterion::Attribute => {`
			`if attribute {`
			`continue;`
			`}`
WIP 2023-03-23 16:12:35 +08:00			`// todo!();`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// attribute = false;`
			`}`
			`crate::Criterion::Sort => {`
			`if sort {`
			`continue;`
			`}`
WIP 2023-03-23 16:12:35 +08:00			`// todo!();`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// sort = false;`
			`}`
			`crate::Criterion::Exactness => {`
			`if exactness {`
			`continue;`
			`}`
WIP 2023-03-23 16:12:35 +08:00			`// todo!();`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// exactness = false;`
			`}`
			`crate::Criterion::Asc(field) => {`
			`if asc.contains(&field) {`
			`continue;`
			`}`
			`asc.insert(field);`
Refactor of the Interner 2023-03-14 23:37:47 +08:00			`// TODO`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`}`
			`crate::Criterion::Desc(field) => {`
			`if desc.contains(&field) {`
			`continue;`
			`}`
			`desc.insert(field);`
WIP 2023-03-23 16:12:35 +08:00			`// todo!();`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`}`
			`}`
			`}`
			`Ok(ranking_rules)`
			`}`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00
			`#[allow(clippy::too_many_arguments)]`
Rename lifetime 2023-03-13 21:03:48 +08:00			`pub fn execute_search<'ctx>(`
			`ctx: &mut SearchContext<'ctx>,`
Introduce a new search module, eventually meant to replace the old one The code here does not compile, because I am merely splitting one giant commit into smaller ones where each commit explains a single file. 2023-02-21 16:41:58 +08:00			`query: &str,`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`terms_matching_strategy: TermsMatchingStrategy,`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`filters: Option<Filter>,`
			`from: usize,`
			`length: usize,`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`placeholder_search_logger: &mut dyn SearchLogger<PlaceholderQuery>,`
			`query_graph_logger: &mut dyn SearchLogger<QueryGraph>,`
WIP 2023-03-18 22:04:34 +08:00			`) -> Result<SearchResult> {`
Introduce a new search module, eventually meant to replace the old one The code here does not compile, because I am merely splitting one giant commit into smaller ones where each commit explains a single file. 2023-02-21 16:41:58 +08:00			`assert!(!query.is_empty());`
Apply a few optimisations for graph-based ranking rules 2023-03-07 21:42:58 +08:00			`let query_terms = located_query_terms_from_string(ctx, query.tokenize(), None)?;`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`let graph = QueryGraph::from_query(ctx, query_terms)?;`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00
WIP 2023-03-18 22:04:34 +08:00			`let mut universe = if let Some(filters) = filters {`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`filters.evaluate(ctx.txn, ctx.index)?`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`} else {`
Intern all strings and phrases in the search logic 2023-03-07 02:21:55 +08:00			`ctx.index.documents_ids(ctx.txn)?`
Fix: computation of initial universe, code organisation 2023-03-06 15:35:01 +08:00			`};`

Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`// TODO: other way to tell whether it is a placeholder search`
			`// This way of doing things is not correct because if someone searches`
			`// for a word that does not appear in any document, the word will be removed`
			`// from the graph and thus its number of nodes will be == 2`
			`// But in that case, we should return no results.`
			`//`
			`// The search is a placeholder search only if there are no tokens?`
WIP 2023-03-18 22:04:34 +08:00			`let documents_ids = if graph.nodes.len() > 2 {`
			`universe = resolve_maximally_reduced_query_graph(`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`ctx,`
			`&universe,`
			`&graph,`
			`terms_matching_strategy,`
			`query_graph_logger,`
			`)?;`

			`let ranking_rules = get_ranking_rules_for_query_graph_search(ctx, terms_matching_strategy)?;`
WIP 2023-03-18 22:04:34 +08:00			`bucket_sort(ctx, ranking_rules, &graph, &universe, from, length, query_graph_logger)?`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`} else {`
			`let ranking_rules = get_ranking_rules_for_placeholder_search(ctx)?;`
			`bucket_sort(`
			`ctx,`
			`ranking_rules,`
			`&PlaceholderQuery,`
			`&universe,`
			`from,`
			`length,`
			`placeholder_search_logger,`
WIP 2023-03-18 22:04:34 +08:00			`)?`
			`};`

			`Ok(SearchResult {`
			`// TODO: correct matching words`
			`matching_words: MatchingWords::default(),`
			`// TODO: candidates with distinct`
			`candidates: universe,`
			`documents_ids,`
			`})`
			`}`

			`impl<'a> Search<'a> {`
			`// TODO`
			`pub fn execute_new(&self) -> Result<SearchResult> {`
			`todo!()`
Reorganise initialisation of ranking rules + rename PathsMap -> PathSet 2023-03-13 16:52:17 +08:00			`}`
Intern more values 2023-03-09 18:12:31 +08:00			`}`