From 7ebd121abcf9642ec4fc0a73eafb73495e1361d5 Mon Sep 17 00:00:00 2001
From: Sarah Hoffmann
Date: Wed, 9 Jul 2025 22:25:40 +0200
Subject: [PATCH] give word break slight advantage towards continuation

prefers longer words
---
 src/nominatim_api/search/icu_tokenizer.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/nominatim_api/search/icu_tokenizer.py b/src/nominatim_api/search/icu_tokenizer.py
index 2bb9ce93..ef6dba28 100644
--- a/src/nominatim_api/search/icu_tokenizer.py
+++ b/src/nominatim_api/search/icu_tokenizer.py
@@ -42,7 +42,7 @@ PENALTY_BREAK = {
     qmod.BREAK_END: -0.5,
     qmod.BREAK_PHRASE: -0.5,
     qmod.BREAK_SOFT_PHRASE: -0.5,
-    qmod.BREAK_WORD: 0.0,
+    qmod.BREAK_WORD: 0.1,
     qmod.BREAK_PART: 0.2,
     qmod.BREAK_TOKEN: 0.4
 }
-- 
2.39.5