mirror of
https://github.com/osm-search/Nominatim.git
synced 2026-02-26 11:08:13 +00:00
Introduction of SPCsvLoader to load special phrases from a csv file
This commit is contained in:
@@ -2,11 +2,12 @@
|
|||||||
Implementation of the 'special-phrases' command.
|
Implementation of the 'special-phrases' command.
|
||||||
"""
|
"""
|
||||||
import logging
|
import logging
|
||||||
from nominatim.errors import UsageError
|
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
from nominatim.tools import SPWikiLoader
|
from nominatim.errors import UsageError
|
||||||
from nominatim.tools import SPImporter
|
|
||||||
from nominatim.db.connection import connect
|
from nominatim.db.connection import connect
|
||||||
|
from nominatim.tools.special_phrases.sp_importer import SPImporter
|
||||||
|
from nominatim.tools.special_phrases.sp_wiki_loader import SPWikiLoader
|
||||||
|
from nominatim.tools.special_phrases.sp_csv_loader import SPCsvLoader
|
||||||
|
|
||||||
LOG = logging.getLogger()
|
LOG = logging.getLogger()
|
||||||
|
|
||||||
@@ -24,23 +25,33 @@ class ImportSpecialPhrases:
|
|||||||
group = parser.add_argument_group('Input arguments')
|
group = parser.add_argument_group('Input arguments')
|
||||||
group.add_argument('--import-from-wiki', action='store_true',
|
group.add_argument('--import-from-wiki', action='store_true',
|
||||||
help='Import special phrases from the OSM wiki to the database.')
|
help='Import special phrases from the OSM wiki to the database.')
|
||||||
group.add_argument('--csv-file', metavar='FILE',
|
group.add_argument('--import-from-csv', metavar='FILE',
|
||||||
help='CSV file containing phrases to import.')
|
help='Import special phrases from a CSV file.')
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def run(args):
|
def run(args):
|
||||||
from ..tokenizer import factory as tokenizer_factory
|
|
||||||
|
|
||||||
if args.import_from_wiki:
|
if args.import_from_wiki:
|
||||||
tokenizer = tokenizer_factory.get_tokenizer_for_db(args.config)
|
ImportSpecialPhrases.start_import(args, SPWikiLoader(args.config))
|
||||||
with connect(args.config.get_libpq_dsn()) as db_connection:
|
|
||||||
SPImporter(
|
|
||||||
args.config, args.phplib_dir, db_connection, SPWikiLoader(args.config)
|
|
||||||
).import_phrases(tokenizer)
|
|
||||||
|
|
||||||
if args.csv_file:
|
if args.import_from_csv:
|
||||||
if not Path(args.csv_file).is_file():
|
if not Path(args.import_from_csv).is_file():
|
||||||
LOG.fatal("CSV file '%s' does not exist.", args.csv_file)
|
LOG.fatal("CSV file '%s' does not exist.", args.import_from_csv)
|
||||||
raise UsageError('Cannot access file.')
|
raise UsageError('Cannot access file.')
|
||||||
|
|
||||||
|
ImportSpecialPhrases.start_import(args, SPCsvLoader(args.import_from_csv))
|
||||||
|
|
||||||
return 0
|
return 0
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def start_import(args, loader):
|
||||||
|
"""
|
||||||
|
Create the SPImporter object containing the right
|
||||||
|
SPLoader and then start the import of special phrases.
|
||||||
|
"""
|
||||||
|
from ..tokenizer import factory as tokenizer_factory
|
||||||
|
|
||||||
|
tokenizer = tokenizer_factory.get_tokenizer_for_db(args.config)
|
||||||
|
with connect(args.config.get_libpq_dsn()) as db_connection:
|
||||||
|
SPImporter(
|
||||||
|
args.config, args.phplib_dir, db_connection, loader
|
||||||
|
).import_phrases(tokenizer)
|
||||||
|
|||||||
@@ -2,7 +2,3 @@
|
|||||||
Module with functions for importing, updating Nominatim databases
|
Module with functions for importing, updating Nominatim databases
|
||||||
as well as general maintenance helpers.
|
as well as general maintenance helpers.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
from nominatim.tools.special_phrases.sp_importer import SPImporter
|
|
||||||
from nominatim.tools.special_phrases.sp_wiki_loader import SPWikiLoader
|
|
||||||
from nominatim.tools.special_phrases.special_phrase import SpecialPhrase
|
|
||||||
|
|||||||
54
nominatim/tools/special_phrases/sp_csv_loader.py
Normal file
54
nominatim/tools/special_phrases/sp_csv_loader.py
Normal file
@@ -0,0 +1,54 @@
|
|||||||
|
"""
|
||||||
|
Module containing the SPCsvLoader class.
|
||||||
|
|
||||||
|
The class allows to load phrases from a csv file.
|
||||||
|
"""
|
||||||
|
import csv
|
||||||
|
import os
|
||||||
|
from nominatim.tools.special_phrases.special_phrase import SpecialPhrase
|
||||||
|
from nominatim.tools.special_phrases.sp_loader import SPLoader
|
||||||
|
from nominatim.errors import UsageError
|
||||||
|
|
||||||
|
class SPCsvLoader(SPLoader):
|
||||||
|
"""
|
||||||
|
Base class for special phrases loaders.
|
||||||
|
Handle the loading of special phrases from external sources.
|
||||||
|
"""
|
||||||
|
def __init__(self, csv_path):
|
||||||
|
super().__init__()
|
||||||
|
self.csv_path = csv_path
|
||||||
|
self.has_been_read = False
|
||||||
|
|
||||||
|
def __next__(self):
|
||||||
|
if self.has_been_read:
|
||||||
|
raise StopIteration()
|
||||||
|
|
||||||
|
self.has_been_read = True
|
||||||
|
SPCsvLoader.check_csv_validity(self.csv_path)
|
||||||
|
return SPCsvLoader.parse_csv(self.csv_path)
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def parse_csv(csv_path):
|
||||||
|
"""
|
||||||
|
Open and parse the given csv file.
|
||||||
|
Create the corresponding SpecialPhrases.
|
||||||
|
"""
|
||||||
|
phrases = set()
|
||||||
|
|
||||||
|
with open(csv_path) as file:
|
||||||
|
reader = csv.DictReader(file, delimiter=',')
|
||||||
|
for row in reader:
|
||||||
|
phrases.add(
|
||||||
|
SpecialPhrase(row['phrase'], row['class'], row['type'], row['operator'])
|
||||||
|
)
|
||||||
|
return phrases
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def check_csv_validity(csv_path):
|
||||||
|
"""
|
||||||
|
Check that the csv file has the right extension.
|
||||||
|
"""
|
||||||
|
_, extension = os.path.splitext(csv_path)
|
||||||
|
|
||||||
|
if extension != '.csv':
|
||||||
|
raise UsageError('The file {} is not a csv file.'.format(csv_path))
|
||||||
@@ -1,8 +1,8 @@
|
|||||||
"""
|
"""
|
||||||
Module containing the SPWikiLoader class.
|
Module containing the SPWikiLoader class.
|
||||||
"""
|
"""
|
||||||
import logging
|
|
||||||
import re
|
import re
|
||||||
|
import logging
|
||||||
from nominatim.tools.special_phrases.special_phrase import SpecialPhrase
|
from nominatim.tools.special_phrases.special_phrase import SpecialPhrase
|
||||||
from nominatim.tools.special_phrases.sp_loader import SPLoader
|
from nominatim.tools.special_phrases.sp_loader import SPLoader
|
||||||
from nominatim.tools.exec_utils import get_url
|
from nominatim.tools.exec_utils import get_url
|
||||||
|
|||||||
@@ -256,7 +256,7 @@ def test_index_command(mock_func_factory, temp_db_cursor, tokenizer_mock,
|
|||||||
assert rank_mock.called == do_ranks
|
assert rank_mock.called == do_ranks
|
||||||
|
|
||||||
def test_special_phrases_command(temp_db, mock_func_factory, tokenizer_mock):
|
def test_special_phrases_command(temp_db, mock_func_factory, tokenizer_mock):
|
||||||
func = mock_func_factory(nominatim.clicmd.special_phrases.SPImporter, 'import_from_wiki')
|
func = mock_func_factory(nominatim.clicmd.special_phrases.SPImporter, 'import_phrases')
|
||||||
|
|
||||||
call_nominatim('special-phrases', '--import-from-wiki')
|
call_nominatim('special-phrases', '--import-from-wiki')
|
||||||
|
|
||||||
|
|||||||
@@ -2,14 +2,15 @@
|
|||||||
Tests for import special phrases methods
|
Tests for import special phrases methods
|
||||||
of the class SPImporter.
|
of the class SPImporter.
|
||||||
"""
|
"""
|
||||||
from nominatim.tools import SpecialPhrase
|
|
||||||
from nominatim.tools import SPWikiLoader
|
|
||||||
from nominatim.errors import UsageError
|
from nominatim.errors import UsageError
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
import tempfile
|
import tempfile
|
||||||
from shutil import copyfile
|
from shutil import copyfile
|
||||||
import pytest
|
import pytest
|
||||||
from nominatim.tools import SPImporter
|
from nominatim.tools.special_phrases.sp_importer import SPImporter
|
||||||
|
from nominatim.tools.special_phrases.sp_wiki_loader import SPWikiLoader
|
||||||
|
from nominatim.tools.special_phrases.sp_csv_loader import SPCsvLoader
|
||||||
|
from nominatim.tools.special_phrases.special_phrase import SpecialPhrase
|
||||||
|
|
||||||
TEST_BASE_DIR = Path(__file__) / '..' / '..'
|
TEST_BASE_DIR = Path(__file__) / '..' / '..'
|
||||||
|
|
||||||
@@ -187,7 +188,7 @@ def test_remove_non_existent_tables_from_db(sp_importer, default_phrases,
|
|||||||
def test_import_from_wiki(monkeypatch, temp_db_conn, def_config, sp_importer,
|
def test_import_from_wiki(monkeypatch, temp_db_conn, def_config, sp_importer,
|
||||||
placex_table, tokenizer_mock):
|
placex_table, tokenizer_mock):
|
||||||
"""
|
"""
|
||||||
Check that the main import_from_wiki() method is well executed.
|
Check that the main import_phrases() method is well executed.
|
||||||
It should create the place_classtype table, the place_id and centroid indexes,
|
It should create the place_classtype table, the place_id and centroid indexes,
|
||||||
grand access to the web user and executing the SQL functions for amenities.
|
grand access to the web user and executing the SQL functions for amenities.
|
||||||
It should also update the database well by deleting or preserving existing entries
|
It should also update the database well by deleting or preserving existing entries
|
||||||
@@ -200,7 +201,9 @@ def test_import_from_wiki(monkeypatch, temp_db_conn, def_config, sp_importer,
|
|||||||
CREATE TABLE place_classtype_amenity_animal_shelter();
|
CREATE TABLE place_classtype_amenity_animal_shelter();
|
||||||
CREATE TABLE place_classtype_wrongclass_wrongtype();""")
|
CREATE TABLE place_classtype_wrongclass_wrongtype();""")
|
||||||
|
|
||||||
monkeypatch.setattr('nominatim.tools.SPWikiLoader._get_wiki_content', mock_get_wiki_content)
|
monkeypatch.setattr('nominatim.tools.special_phrases.sp_wiki_loader.SPWikiLoader._get_wiki_content',
|
||||||
|
mock_get_wiki_content)
|
||||||
|
|
||||||
tokenizer = tokenizer_mock()
|
tokenizer = tokenizer_mock()
|
||||||
sp_importer.import_phrases(tokenizer)
|
sp_importer.import_phrases(tokenizer)
|
||||||
|
|
||||||
@@ -244,7 +247,7 @@ def test_import_from_wiki(monkeypatch, temp_db_conn, def_config, sp_importer,
|
|||||||
else:
|
else:
|
||||||
assert not temp_db_cursor.fetchone()
|
assert not temp_db_cursor.fetchone()
|
||||||
|
|
||||||
def mock_get_wiki_content(self, lang):
|
def mock_get_wiki_content(lang):
|
||||||
"""
|
"""
|
||||||
Mock the _get_wiki_content() method to return
|
Mock the _get_wiki_content() method to return
|
||||||
static xml test file content.
|
static xml test file content.
|
||||||
|
|||||||
Reference in New Issue
Block a user