From dc2cb58cf1ce3fa33f791d095f095c429a6ad9c0 Mon Sep 17 00:00:00 2001 From: ManyTheFish Date: Wed, 25 Sep 2024 11:12:30 +0200 Subject: [PATCH] use charabia default for all-tokenization --- milli/Cargo.toml | 12 +----------- 1 file changed, 1 insertion(+), 11 deletions(-) diff --git a/milli/Cargo.toml b/milli/Cargo.toml index 70d09ce4e..3c4a44639 100644 --- a/milli/Cargo.toml +++ b/milli/Cargo.toml @@ -98,17 +98,7 @@ rand = { version = "0.8.5", features = ["small_rng"] } [features] all-tokenizations = [ - "charabia/chinese", - "charabia/hebrew", - "charabia/japanese", - "charabia/thai", - "charabia/korean", - "charabia/greek", - "charabia/khmer", - "charabia/vietnamese", - "charabia/swedish-recomposition", - "charabia/german-segmentation", - "charabia/turkish", + "charabia/default", ] # Use POSIX semaphores instead of SysV semaphores in LMDB