Moved KANJI_MAP to global variable

This commit is contained in:
miku0
2023-07-26 21:43:22 +00:00
parent 848e5ac5de
commit fac8c32cda
2 changed files with 28 additions and 37 deletions

View File

@@ -1,36 +0,0 @@
# SPDX-License-Identifier: GPL-3.0-or-later
#
# This file is part of Nominatim. (https://nominatim.org)
#
# Copyright (C) 2022 by the Nominatim developer community.
# For a full list of authors see the git log.
"""
Helper function for converting Kanji (Japanese) numerals to Arabic numerals.
"""
def convert_kanji_sequence_to_number(sequence: str) -> str:
    """Convert the Kanji digits in a string to Arabic digits.

    Every character that is one of the Kanji digits 零, 一, 二, ... 九 is
    replaced by the matching ASCII digit '0'-'9'. All other characters are
    copied through unchanged and in their original order.

    The substitution is purely digit-by-digit: positional numerals such as
    十 (ten) or 百 (hundred) are not in the table and are left untouched.

    Args:
        sequence: The text to convert.

    Returns:
        A copy of ``sequence`` with each Kanji digit replaced.
    """
    # Each key must be a distinct single Kanji digit. Empty or duplicate
    # keys would silently collapse into one entry and make the conversion
    # a no-op.
    kanji_map = {
        '零': '0',
        '一': '1',
        '二': '2',
        '三': '3',
        '四': '4',
        '五': '5',
        '六': '6',
        '七': '7',
        '八': '8',
        '九': '9',
    }
    # A per-character lookup yields the same result as buffering runs of
    # digits, because the output order always equals the input order.
    return ''.join(kanji_map.get(char, char) for char in sequence)

View File

@@ -17,7 +17,34 @@ from typing import List, Optional
from nominatim.tokenizer.sanitizers.base import ProcessInfo from nominatim.tokenizer.sanitizers.base import ProcessInfo
from nominatim.tokenizer.sanitizers.config import SanitizerConfig from nominatim.tokenizer.sanitizers.config import SanitizerConfig
from nominatim.data.place_name import PlaceName from nominatim.data.place_name import PlaceName
from nominatim.tokenizer.sanitizers.kanji_utils import convert_kanji_sequence_to_number
# Lookup table from a single Kanji digit to its Arabic digit.
# Each key must be a distinct one-character string: duplicate or empty
# keys would collapse into a single entry and disable the conversion in
# convert_kanji_sequence_to_number().
KANJI_MAP = {
    '零': '0',
    '一': '1',
    '二': '2',
    '三': '3',
    '四': '4',
    '五': '5',
    '六': '6',
    '七': '7',
    '八': '8',
    '九': '9',
}
def convert_kanji_sequence_to_number(sequence: str) -> str:
    """Return ``sequence`` with the characters listed in KANJI_MAP replaced.

    Each character that is a key of the module-level ``KANJI_MAP`` is
    substituted by its mapped value; every other character is kept as it
    is. The order of the characters is preserved.
    """
    return ''.join(KANJI_MAP.get(symbol, symbol) for symbol in sequence)
def create(_: SanitizerConfig) -> Callable[[ProcessInfo], None]: def create(_: SanitizerConfig) -> Callable[[ProcessInfo], None]:
#def create(config: SanitizerConfig) -> Callable[[ProcessInfo],None]: #def create(config: SanitizerConfig) -> Callable[[ProcessInfo],None]: