adapt tests for ICU tokenizer

2026-03-12 22:04:07 +00:00 · 2021-06-06 11:00:44 +02:00
parent 8413075249
commit 2e3c5d4c5b
8 changed files with 143 additions and 67 deletions
--- a/nominatim/tokenizer/legacy_tokenizer.py
+++ b/nominatim/tokenizer/legacy_tokenizer.py
@@ -271,8 +271,7 @@ class LegacyNameAnalyzer:
            self.conn = None


-    @staticmethod
-    def get_word_token_info(conn, words):
+    def get_word_token_info(self, words):
        """ Return token information for the given list of words.
            If a word starts with # it is assumed to be a full name
            otherwise is a partial name.
@@ -283,7 +282,7 @@ class LegacyNameAnalyzer:
            The function is used for testing and debugging only
            and not necessarily efficient.
        """
-        with conn.cursor() as cur:
+        with self.conn.cursor() as cur:
            cur.execute("""SELECT t.term, word_token, word_id
                           FROM word, (SELECT unnest(%s::TEXT[]) as term) t
                           WHERE word_token = (CASE