use word_token length when penalizing against postcodes

2026-02-16 15:47:58 +00:00 · 2025-03-18 23:07:27 +01:00
parent 7b3c725f2a
commit 2c61fe08a0
1 changed files with 2 additions and 2 deletions
--- a/src/nominatim_api/search/icu_tokenizer.py
+++ b/src/nominatim_api/search/icu_tokenizer.py
@@ -269,10 +269,10 @@ class ICUQueryAnalyzer(AbstractQueryAnalyzer):
        """
        for i, node, tlist in query.iter_token_lists():
            if tlist.ttype == qmod.TOKEN_POSTCODE:
+                tlen = len(cast(ICUToken, tlist.tokens[0]).word_token)
                for repl in node.starting:
                    if repl.end == tlist.end and repl.ttype != qmod.TOKEN_POSTCODE \
-                       and (repl.ttype != qmod.TOKEN_HOUSENUMBER
-                            or len(tlist.tokens[0].lookup_word) > 4):
+                       and (repl.ttype != qmod.TOKEN_HOUSENUMBER or tlen > 4):
                        repl.add_penalty(0.39)
            elif (tlist.ttype == qmod.TOKEN_HOUSENUMBER
                  and len(tlist.tokens[0].lookup_word) <= 3):