add tests for new full name computation with ICU

This commit is contained in:
Sarah Hoffmann 2021-05-24 10:29:21 +02:00
parent 4f4d15c28a
commit 24c986c842
3 changed files with 7 additions and 16 deletions

View File

@ -537,8 +537,6 @@ class _TokenInfo:
"""
# Start with all partial names
terms = set((part for ns in names for part in ns.split()))
# Add partials for the full terms (TO BE REMOVED)
terms.update((n for n in names))
# Add the full names
terms.update((' ' + n for n in names))

View File

@ -4,8 +4,8 @@ no-test-db: bdd-no-test-db php
bdd:
cd bdd && behave -DREMOVE_TEMPLATE=1
bdd-no-test-db:
cd bdd && behave -DREMOVE_TEMPLATE=1 db osm2pgsql
icu:
cd bdd && behave -DREMOVE_TEMPLATE=1 -DTOKENIZER=legacy_icu
php:
cd php && phpunit ./

View File

@ -232,23 +232,16 @@ def test_process_place_names(analyzer, getorcreate_term_id):
@pytest.mark.parametrize('sep', [',' , ';'])
def test_full_names_with_separator(analyzer, getorcreate_term_id, sep):
with analyzer() as anl:
full_names =
anl._compute_full_names({'name' : sep.join(('New York', 'Big Apple'))})
names = anl._compute_full_names({'name' : sep.join(('New York', 'Big Apple'))})
expect = set((anl.make_standard_word(w) for w in ('New York', 'Big Apple')))
assert full_names == expect
assert names == set(('NEW YORK', 'BIG APPLE'))
def test_process_place_names_with_bracket(analyzer, getorcreate_term_id):
def test_full_names_with_bracket(analyzer, getorcreate_term_id):
with analyzer() as anl:
info = anl.process_place({'name' :
{'name' : 'Houseboat (left)'}})
names = anl._compute_full_names({'name' : 'Houseboat (left)'})
expect = set((anl.make_standard_word(w) for w in
(' houseboat', ' houseboat left', 'houseboat', 'left')))
assert eval(info['names']) == expect
assert names == set(('HOUSEBOAT (LEFT)', 'HOUSEBOAT'))
@pytest.mark.parametrize('pcode', ['12345', 'AB 123', '34-345'])