From: Sarah Hoffmann Date: Sat, 16 Mar 2024 10:26:00 +0000 (+0100) Subject: add penalty for single words that look like stop words X-Git-Tag: deploy~7^2^2~1 X-Git-Url: https://git.openstreetmap.org/nominatim.git/commitdiff_plain/ff3230a7f3fcb314c22ab977fa014465ff274ec8 add penalty for single words that look like stop words --- diff --git a/nominatim/api/search/db_search_builder.py b/nominatim/api/search/db_search_builder.py index ef7a66b8..f8eabad1 100644 --- a/nominatim/api/search/db_search_builder.py +++ b/nominatim/api/search/db_search_builder.py @@ -226,6 +226,8 @@ class SearchBuilder: name_fulls = self.query.get_tokens(name, TokenType.WORD) if name_fulls: fulls_count = sum(t.count for t in name_fulls) + if len(name_partials) == 1: + penalty += min(1, max(0, (exp_count - 50 * fulls_count) / (1000 * fulls_count))) # At this point drop unindexed partials from the address. # This might yield wrong results, nothing we can do about that. if not partials_indexed: