add penalty for single words that look like stop words

This commit is contained in:
Sarah Hoffmann 2024-03-16 11:26:00 +01:00
parent 07b7fd1dbb
commit ff3230a7f3

View File

@@ -226,6 +226,8 @@ class SearchBuilder:
name_fulls = self.query.get_tokens(name, TokenType.WORD)
if name_fulls:
fulls_count = sum(t.count for t in name_fulls)
if len(name_partials) == 1:
penalty += min(1, max(0, (exp_count - 50 * fulls_count) / (1000 * fulls_count)))
# At this point drop unindexed partials from the address.
# This might yield wrong results, but there is nothing we can do about that.
if not partials_indexed: