mirror of
https://github.com/osm-search/Nominatim.git
synced 2024-12-26 06:22:13 +03:00
101 lines
3.8 KiB
Python
101 lines
3.8 KiB
Python
# SPDX-License-Identifier: GPL-2.0-only
|
|
#
|
|
# This file is part of Nominatim. (https://nominatim.org)
|
|
#
|
|
# Copyright (C) 2022 by the Nominatim developer community.
|
|
# For a full list of authors see the git log.
|
|
"""
|
|
Legacy word table for testing with functions to prefill and test contents
|
|
of the table.
|
|
"""
|
|
|
|
class MockLegacyWordTable:
    """ A word table for testing using legacy word table structure.

        The constructor creates the `word` table through the given
        connection. The `add_*` methods insert a single row and commit,
        the `count*` and `get_*` methods read the table contents back.
    """
    def __init__(self, conn):
        """ Create the `word` table using `conn` and commit the change.

            `conn` must offer `cursor()` (usable as a context manager)
            and `commit()`. It is kept in `self.conn` for later calls.
        """
        self.conn = conn
        with conn.cursor() as cur:
            cur.execute("""CREATE TABLE word (word_id INTEGER,
                                              word_token text,
                                              word text,
                                              class text,
                                              type text,
                                              country_code varchar(2),
                                              search_name_count INTEGER,
                                              operator TEXT)""")

        conn.commit()

    def _insert(self, sql, params):
        """ Run one parametrized statement and commit it right away.
        """
        with self.conn.cursor() as cur:
            cur.execute(sql, params)
        self.conn.commit()

    def _fetch_unique(self, sql):
        """ Run a query and return its rows as a set of tuples.

            Fails with an AssertionError when the query returned the same
            row more than once, i.e. when the set is smaller than the
            row count reported by the cursor.
        """
        with self.conn.cursor() as cur:
            cur.execute(sql)
            result = {tuple(row) for row in cur}
            assert len(result) == cur.rowcount, "Word table has duplicates."
            return result

    def add_full_word(self, word_id, word, word_token=None):
        """ Insert a row for a full word.

            The token stored is `word_token` (or `word` when no token is
            given) with a single blank prepended.
        """
        self._insert("""INSERT INTO word (word_id, word_token, word)
                        VALUES (%s, %s, %s)
                     """, (word_id, ' ' + (word_token or word), word))

    def add_special(self, word_token, word, cls, typ, oper):
        """ Insert a row with token, word, class, type and operator set.
        """
        self._insert("""INSERT INTO word (word_token, word, class, type, operator)
                        VALUES (%s, %s, %s, %s, %s)
                     """, (word_token, word, cls, typ, oper))

    def add_country(self, country_code, word_token):
        """ Insert a row that only has a token and a country code.
        """
        self._insert("INSERT INTO word (word_token, country_code) VALUES(%s, %s)",
                     (word_token, country_code))

    def add_postcode(self, word_token, postcode):
        """ Insert a row with class 'place' and type 'postcode' where
            the postcode is saved in the `word` column.
        """
        self._insert("""INSERT INTO word (word_token, word, class, type)
                        VALUES (%s, %s, 'place', 'postcode')
                     """, (word_token, postcode))

    def count(self):
        """ Return the total number of rows in the word table.
        """
        with self.conn.cursor() as cur:
            return cur.scalar("SELECT count(*) FROM word")

    def count_special(self):
        """ Return the number of rows whose class is not 'place'.
        """
        with self.conn.cursor() as cur:
            return cur.scalar("SELECT count(*) FROM word WHERE class != 'place'")

    def get_special(self):
        """ Return the set of (word_token, word, class, type, operator)
            tuples of all rows whose class is not 'place'.

            Raises an AssertionError when a tuple appears more than once.
        """
        return self._fetch_unique("""SELECT word_token, word, class, type, operator
                                     FROM word WHERE class != 'place'""")

    def get_country(self):
        """ Return the set of (country_code, word_token) tuples of all
            rows that have a country code.

            Raises an AssertionError when a tuple appears more than once.
        """
        return self._fetch_unique("""SELECT country_code, word_token
                                     FROM word WHERE country_code is not null""")

    def get_postcodes(self):
        """ Return the set of words saved with class 'place' and
            type 'postcode'.
        """
        with self.conn.cursor() as cur:
            cur.execute("""SELECT word FROM word
                           WHERE class = 'place' and type = 'postcode'""")
            return {row[0] for row in cur}

    def get_partial_words(self):
        """ Return the set of (word_token, search_name_count) tuples of
            all rows without class and country code whose token does not
            start with a blank.
        """
        with self.conn.cursor() as cur:
            # No parameters are handed in here: the statement contains
            # a literal '%' in its LIKE pattern.
            cur.execute("""SELECT word_token, search_name_count FROM word
                           WHERE class is null and country_code is null
                                 and not word_token like ' %'""")
            return {tuple(row) for row in cur}
|
|
|