mirror of
https://github.com/osm-search/Nominatim.git
synced 2026-02-14 18:37:58 +00:00
generalize filter for sanitizers
This commit is contained in:
@@ -302,7 +302,7 @@ class TestAllParameters:
|
||||
|
||||
def test_list_arguments_pass(self):
    """Run the sanitizer with list-valued arguments and expect an empty result.

    The three positional arguments are all passed as lists here.
    NOTE(review): their meaning (presumably country codes, rank ranges and
    suffix patterns) is defined by run_sanitizer_on -- confirm there.
    """
    # Only the post-change keyword line of the diff hunk is kept; the
    # superseded `ref_abc='foo'` variant left the call unbalanced.
    res = self.run_sanitizer_on(['de', 'in'], ['20-28', '30'], [r'abc.*', r'[\s\S]*'],
                                name='foo', ref='foo', name_abcxx='bar', ref_pqr='baz')

    assert res == []
|
||||
|
||||
@@ -315,7 +315,7 @@ class TestAllParameters:
|
||||
|
||||
def test_mix_arguments_pass(self):
    """Run the sanitizer with a mix of scalar and list arguments; expect [].

    The first and third positional arguments are plain strings while the
    second is a list.
    NOTE(review): argument semantics come from run_sanitizer_on -- confirm.
    """
    # Only the post-change keyword line of the diff hunk is kept; the
    # superseded `name='foo'` variant left the call unbalanced.
    res = self.run_sanitizer_on('de', ['10', '20-28', '30'], r'[\s\S]*',
                                name_abc='foo', ref_abc='foo', name_abcxx='bar', ref_pqr='baz')

    assert res == []
|
||||
|
||||
|
||||
@@ -10,17 +10,12 @@ Tests for sanitizer configuration helper functions.
|
||||
import pytest
|
||||
|
||||
from nominatim.errors import UsageError
|
||||
from nominatim.tokenizer.place_sanitizer import PlaceName
|
||||
from nominatim.tokenizer.sanitizers.config import SanitizerConfig
|
||||
|
||||
def test_string_list_default_empty():
    """A config built without arguments returns [] for 'op' when no default is given."""
    config = SanitizerConfig()

    assert config.get_string_list('op') == []
|
||||
|
||||
|
||||
def test_string_list_default_none():
    """With default=None, the lookup of 'op' on an argument-less config is None."""
    value = SanitizerConfig().get_string_list('op', default=None)

    assert value is None
|
||||
|
||||
|
||||
def test_string_list_default_something():
    """A list passed as default is what the lookup of 'op' returns."""
    fallback = ['a', 'b']
    result = SanitizerConfig().get_string_list('op', default=fallback)

    assert result == ['a', 'b']
|
||||
|
||||
@@ -78,36 +73,77 @@ def test_create_split_regex_empty_delimiter():
|
||||
regex = SanitizerConfig({'delimiters': ''}).get_delimiter()
|
||||
|
||||
|
||||
@pytest.mark.parametrize('inp', ('name', 'name:de', 'na\\me', '.*'))
|
||||
def test_create_kind_filter_no_params(inp):
|
||||
filt = SanitizerConfig().get_filter_kind()
|
||||
@pytest.mark.parametrize('inp', ('name', 'name:de', 'na\\me', '.*', ''))
def test_create_name_filter_no_param_no_default(inp):
    """The 'name' filter accepts every sample input.

    The config only carries a 'filter-kind' entry and get_filter is called
    without a default.
    """
    config = SanitizerConfig({'filter-kind': 'place'})
    accepts = config.get_filter('name')

    assert accepts(inp)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('inp', ('name', 'name:de', 'na\\me', '.*', ''))
def test_create_name_filter_no_param_default_pass_all(inp):
    """With the 'PASS_ALL' default on an argument-less config, every input is accepted."""
    config = SanitizerConfig()
    accepts = config.get_filter('name', 'PASS_ALL')

    assert accepts(inp)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('inp', ('name', 'name:de', 'na\\me', '.*', ''))
def test_create_name_filter_no_param_default_fail_all(inp):
    """With the 'FAIL_ALL' default on an argument-less config, every input is rejected."""
    config = SanitizerConfig()
    accepts = config.get_filter('name', 'FAIL_ALL')

    assert not accepts(inp)
|
||||
|
||||
|
||||
def test_create_name_filter_no_param_default_invalid_string():
    """The string default 'abc' is expected to raise ValueError."""
    # Construction stays inside the context manager so that exactly the same
    # calls are covered by the expectation.
    with pytest.raises(ValueError):
        SanitizerConfig().get_filter('name', 'abc')
|
||||
|
||||
|
||||
def test_create_name_filter_no_param_default_empty_list():
    """An empty list passed as default is expected to raise ValueError."""
    # Construction stays inside the context manager so that exactly the same
    # calls are covered by the expectation.
    with pytest.raises(ValueError):
        SanitizerConfig().get_filter('name', [])
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('de', 'name:de', 'ende'))
def test_create_kind_filter_default_positive(kind):
    """With nothing configured, the default pattern list ['.*de'] accepts each sample."""
    config = SanitizerConfig()
    matches = config.get_filter('filter-kind', ['.*de'])

    assert matches(kind)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('de', 'name:de', 'ende'))
def test_create_kind_filter_default_negetive(kind):
    """With nothing configured, the default pattern list ['.*fr'] rejects each sample."""
    config = SanitizerConfig()
    matches = config.get_filter('filter-kind', ['.*fr'])

    assert not matches(kind)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('lang', 'lang:de', 'langxx'))
def test_create_kind_filter_custom_regex_positive(kind):
    """A configured 'filter-kind' pattern is used instead of the passed default.

    The config sets 'lang.*' while the default list is ['.*fr']; every sample
    starts with 'lang' and the test expects all of them to be accepted.
    """
    # The superseded `'.*de'` / get_filter_kind() assignment from the diff
    # hunk is dropped: it was immediately overwritten and does not fit the
    # 'lang*' samples.
    filt = SanitizerConfig({'filter-kind': 'lang.*'}
                          ).get_filter('filter-kind', ['.*fr'])

    assert filt(kind)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('de ', '123', '', 'bedece'))
def test_create_kind_filter_custom_regex_negative(kind):
    """Samples that the test expects the configured '.*de' filter to reject.

    The samples include 'de ' (trailing space) and 'bedece' ('de' not at the
    end), so the test expects the pattern to be applied to the whole string.
    """
    # The superseded get_filter_kind() assignment from the diff hunk is
    # dropped; it was dead code overwritten by this call.
    filt = SanitizerConfig({'filter-kind': '.*de'}).get_filter('filter-kind')

    assert not filt(kind)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('name', 'fr', 'name:fr', 'frfr', '34'))
def test_create_kind_filter_many_positive(kind):
    """Each sample is expected to be accepted by a filter built from several patterns.

    'filter-kind' is configured as the list ['.*fr', 'name', r'\\d+'].
    """
    # The superseded get_filter_kind() assignment from the diff hunk is
    # dropped; it was dead code overwritten by this call.
    filt = SanitizerConfig({'filter-kind': ['.*fr', 'name', r'\d+']}
                          ).get_filter('filter-kind')

    assert filt(kind)
|
||||
|
||||
|
||||
@pytest.mark.parametrize('kind', ('name:de', 'fridge', 'a34', '.*', '\\'))
def test_create_kind_filter_many_negative(kind):
    """Each sample is expected to be rejected by a filter built from several patterns.

    'filter-kind' is configured as the list ['.*fr', 'name', r'\\d+']. The
    samples include partial matches such as 'fridge' and 'a34'.
    """
    # The superseded get_filter_kind() assignment from the diff hunk is
    # dropped; it was dead code overwritten by this call.
    filt = SanitizerConfig({'filter-kind': ['.*fr', 'name', r'\d+']}
                          ).get_filter('filter-kind')

    assert not filt(kind)
|
||||
|
||||
Reference in New Issue
Block a user