mirror of
https://github.com/osm-search/Nominatim.git
synced 2024-12-25 14:02:12 +03:00
781e83ddc3
The variable shadowing causes bad results when used with LuaJIT.
555 lines
14 KiB
Lua
555 lines
14 KiB
Lua
-- Core functions for Nominatim import flex style.
|
|
--
|
|
|
|
-- Table holding everything this file exports; it is returned at the end.
local module = {}

-- Style configuration. All of these start out unset and are filled in by
-- the module.set_*() convenience functions further down.
local PRE_DELETE, PRE_EXTRAS        -- tag filters, see module.set_prefilters()
local POST_DELETE                   -- tag filter, see module.set_unused_handling()
local MAIN_KEYS                     -- main tag table, see module.set_main_tags()
local NAMES                         -- name classifier, see module.set_name_tags()
local ADDRESS_TAGS                  -- address classifier, see module.set_address_tags()
local SAVE_EXTRA_MAINS = false      -- replaced by module.set_unused_handling()
local POSTCODE_FALLBACK = true      -- may be overridden by module.set_address_tags()

-- tables required for taginfo
module.TAGINFO_MAIN = {keys = {}, delete_tags = {}}
module.TAGINFO_NAME_KEYS = {}
module.TAGINFO_ADDRESS_KEYS = {}
|
|
|
|
|
|
-- The single place table.
--
-- Every row written by Place:write_row() goes into this table. The row is
-- keyed by the OSM object (osm_type/osm_id) and carries the main tag as
-- class/type plus the collected names, address parts and extra tags.
local place_table = osm2pgsql.define_table({
    name = 'place',
    ids = {type = 'any', id_column = 'osm_id', type_column = 'osm_type'},
    columns = {
        {column = 'class', type = 'text', not_null = true},
        {column = 'type', type = 'text', not_null = true},
        {column = 'admin_level', type = 'smallint'},
        {column = 'name', type = 'hstore'},
        {column = 'address', type = 'hstore'},
        {column = 'extratags', type = 'hstore'},
        {column = 'geometry', type = 'geometry', projection = 'WGS84', not_null = true},
    },
    -- Tablespaces come from the environment; os.getenv() yields nil for
    -- variables that are not set, which leaves the option unset.
    data_tablespace = os.getenv('NOMINATIM_TABLESPACE_PLACE_DATA'),
    index_tablespace = os.getenv('NOMINATIM_TABLESPACE_PLACE_INDEX'),
    indexes = {},
})
|
|
|
|
------------ Geometry functions for relations ---------------------
|
|
|
|
-- Geometry builder for area-like relations.
--   o - the relation object that Place hands to its geom_func
-- Returns whatever the object's as_multipolygon() method produces.
function module.relation_as_multipolygon(o)
    return o:as_multipolygon()
end
|
|
|
|
-- Geometry builder for line-like relations.
--   o - the relation object that Place hands to its geom_func
-- The members are first assembled into a multilinestring and the result is
-- then passed through line_merge().
function module.relation_as_multiline(o)
    local lines = o:as_multilinestring()
    return lines:line_merge()
end
|
|
|
|
|
|
-- Default mapping from the value of a relation's 'type' tag to the function
-- that builds its geometry. Relations with any other type are skipped by
-- module.process_relation(). module.set_relation_types() replaces this table.
module.RELATION_TYPES = {
    multipolygon = module.relation_as_multipolygon,
    boundary = module.relation_as_multipolygon,
    waterway = module.relation_as_multiline,
}
|
|
|
|
------------- Place class ------------------------------------------
|
|
|
|
-- Place wraps one OSM object while its tags are being sorted into names,
-- address parts, extra tags and main tags.
local Place = {}
Place.__index = Place

-- Create the Place wrapper for an OSM object.
--   object    - object as received by the process_* callbacks; must provide
--               grab_tag() and a 'tags' table
--   geom_func - function(object) returning the geometry; it is only invoked
--               later, when the first row is written
--
-- The 'admin_level' tag is read through object:grab_tag(). Anything that is
-- not a whole number in the range 1..15 is replaced by 15.
-- NOTE(review): grab_tag() presumably also removes the tag from the
-- object - confirm against the osm2pgsql documentation.
function Place.new(object, geom_func)
    local level = tonumber(object:grab_tag('admin_level'))
    local usable = level ~= nil
                   and level > 0 and level <= 15
                   and math.floor(level) == level
    if not usable then
        level = 15
    end

    return setmetatable({
        object = object,
        geom_func = geom_func,
        admin_level = level,
        num_entries = 0,    -- number of rows written so far
        has_name = false,
        names = {},
        address = {},
        extratags = {},
    }, Place)
end
|
|
|
|
-- Run a delete/extra filter over the tags still present on the object.
--   data.delete - optional function(k, v); matching tags are dropped
--   data.extra  - optional function(k, v); matching tags are moved into
--                 self.extratags. Only consulted for tags that the delete
--                 filter did not claim.
function Place:clean(data)
    local tags = self.object.tags

    -- Clearing existing keys while traversing with pairs() is permitted.
    for key, value in pairs(tags) do
        local drop = data.delete ~= nil and data.delete(key, value)
        if drop then
            tags[key] = nil
        elseif data.extra ~= nil and data.extra(key, value) then
            self.extratags[key] = value
            tags[key] = nil
        end
    end
end
|
|
|
|
-- Remove all tags accepted by a matcher from the object.
--   data.match - optional function(k, v); nothing happens when it is nil
function Place:delete(data)
    local matcher = data.match
    if matcher == nil then
        return
    end

    local tags = self.object.tags
    for key, value in pairs(tags) do
        if matcher(key, value) then
            tags[key] = nil
        end
    end
end
|
|
|
|
-- Move all tags accepted by a matcher from the object into self.extratags.
--   data.match - optional function(k, v)
-- Returns the number of tags that were moved (0 when no matcher is given).
function Place:grab_extratags(data)
    local matcher = data.match
    if matcher == nil then
        return 0
    end

    local tags = self.object.tags
    local moved = 0
    for key, value in pairs(tags) do
        if matcher(key, value) then
            tags[key] = nil
            self.extratags[key] = value
            moved = moved + 1
        end
    end

    return moved
end
|
|
|
|
-- Key prefixes removed from address tags, tried in this order.
local ADDRESS_KEY_PREFIXES = {'addr:', 'is_in:'}

-- Return the tag key without a leading 'addr:' or 'is_in:'.
-- Only the first matching prefix is removed; keys without one of these
-- prefixes are returned unchanged.
local function strip_address_prefix(k)
    for _, prefix in ipairs(ADDRESS_KEY_PREFIXES) do
        if k:sub(1, #prefix) == prefix then
            return k:sub(#prefix + 1)
        end
    end

    return k
end
|
|
|
|
|
|
-- Move address tags from the object into self.address.
--   data.groups - optional function(k, v) returning the address group of a
--                 tag or nil when the tag is not an address tag
--
-- Group handling:
--   'main'  - stored under the key without 'addr:'/'is_in:' prefix, marks
--             the place as named and is counted
--   'extra' - stored under the key without prefix
--   other   - stored under the group name itself
-- Returns the number of 'main' address tags found.
function Place:grab_address_parts(data)
    local classify = data.groups
    if classify == nil then
        return 0
    end

    local tags = self.object.tags
    local main_count = 0

    for key, value in pairs(tags) do
        local group = classify(key, value)

        if group ~= nil then
            local target
            if group == 'main' then
                self.has_name = true
                main_count = main_count + 1
                target = strip_address_prefix(key)
            elseif group == 'extra' then
                target = strip_address_prefix(key)
            else
                target = group
            end

            self.address[target] = value
            tags[key] = nil
        end
    end

    return main_count
end
|
|
|
|
|
|
-- Move name tags from the object into self.names.
--   data.groups - optional function(k, v) returning the name group of a tag
--                 or nil when the tag is not a name tag
--
-- Tags of group 'main' and 'house' mark the place as named. A 'house' tag
-- additionally yields the fallback main tag {'place', 'house', 'always'}.
-- Returns that fallback or nil.
function Place:grab_name_parts(data)
    local classify = data.groups
    if classify == nil then
        return nil
    end

    local tags = self.object.tags
    local fallback = nil

    for key, value in pairs(tags) do
        local group = classify(key, value)

        if group ~= nil then
            self.names[key] = value
            tags[key] = nil

            if group == 'main' or group == 'house' then
                self.has_name = true
            end
            if group == 'house' then
                fallback = {'place', 'house', 'always'}
            end
        end
    end

    return fallback
end
|
|
|
|
|
|
-- Write a row for the main tag k=v if its main-tag type permits it.
--   k                - main tag key (becomes the row's class)
--   v                - tag value; when nil/false the object's own value for
--                      `k` is used
--   mtype            - main-tag type: a string, or a table that maps tag
--                      values to types with entry [1] as default
--   save_extra_mains - forwarded unchanged to write_row()
--
-- Types handled:
--   'always'         - always written
--   'named'          - written when the place has a name
--   'named_with_key' - written when the object has '<k>:name' or
--                      '<k>:name:*' tags; those tags (with the '<k>:' part
--                      cut off) replace self.names for this one row
-- Returns the result of write_row(), or 0 when nothing was written.
function Place:write_place(k, v, mtype, save_extra_mains)
    if mtype == nil then
        return 0
    end

    v = v or self.object.tags[k]
    if v == nil then
        return 0
    end

    if type(mtype) == 'table' then
        mtype = mtype[v] or mtype[1]
    end

    if mtype == 'always' or (self.has_name and mtype == 'named') then
        return self:write_row(k, v, save_extra_mains)
    end

    if mtype ~= 'named_with_key' then
        return 0
    end

    -- Collect '<k>:name' and '<k>:name:<suffix>' tags.
    local prefix = k .. ':name'
    local prefix_len = #prefix
    local keyed_names = {}
    for tag_key, tag_value in pairs(self.object.tags) do
        if tag_key:sub(1, prefix_len) == prefix then
            -- Empty when the key is exactly the prefix.
            local follower = tag_key:sub(prefix_len + 1, prefix_len + 1)
            if follower == '' or follower == ':' then
                keyed_names[tag_key:sub(#k + 2)] = tag_value
            end
        end
    end

    if next(keyed_names) == nil then
        return 0
    end

    -- Swap in the key-specific names for this row only.
    local saved_names = self.names
    self.names = keyed_names
    local written = self:write_row(k, v, save_extra_mains)
    self.names = saved_names

    return written
end
|
|
|
|
-- Insert one row for the main tag k=v into the place table.
--   k                - row class
--   v                - row type
--   save_extra_mains - optional function(k, v); every remaining tag of the
--                      object (other than `k`) that it accepts is added to
--                      the extratags of this row. Any false value (nil or
--                      false) disables this step.
--
-- The geometry is created on first use through self.geom_func and cached in
-- self.geometry. Returns 0 without writing when the geometry is null,
-- otherwise 1.
function Place:write_row(k, v, save_extra_mains)
    if self.geometry == nil then
        self.geometry = self.geom_func(self.object)
    end
    if self.geometry:is_null() then
        return 0
    end

    -- Test for truthiness rather than `~= nil`: process_tags() passes the
    -- module-level SAVE_EXTRA_MAINS, which starts out as `false`, and calling
    -- `false` raises "attempt to call a boolean value".
    -- The loop variables deliberately do not reuse the names k and v.
    if save_extra_mains then
        for extra_k, extra_v in pairs(self.object.tags) do
            if extra_k ~= k and save_extra_mains(extra_k, extra_v) then
                self.extratags[extra_k] = extra_v
            end
        end
    end

    -- `next(t) and t` evaluates to nil for an empty table, so empty
    -- collections are left out of the row.
    place_table:insert{
        class = k,
        type = v,
        admin_level = self.admin_level,
        name = next(self.names) and self.names,
        address = next(self.address) and self.address,
        extratags = next(self.extratags) and self.extratags,
        geometry = self.geometry
    }

    -- Take the temporarily added tags out again so that they do not leak
    -- into rows written later for the same object.
    if save_extra_mains then
        for tk, tv in pairs(self.object.tags) do
            if save_extra_mains(tk, tv) then
                self.extratags[tk] = nil
            end
        end
    end

    self.num_entries = self.num_entries + 1

    return 1
end
|
|
|
|
|
|
-- Build a matcher function for tags.
--   data.keys - optional list of key patterns: 'key' (exact), 'prefix*'
--               or '*suffix'. A lone '*' is ignored.
--   data.tags - optional table mapping a key to a list of values; the tag
--               matches when it has one of these values. Ignored for keys
--               already listed in data.keys.
--
-- Returns nil when `data` is nil or an empty table. Otherwise returns a
-- function(k, v) that yields true when the tag matches and false if not.
function module.tag_match(data)
    if data == nil or next(data) == nil then
        return nil
    end

    local exact = {}            -- key -> true | set of accepted values
    local prefixes_by_len = {}  -- length -> set of prefixes of that length
    local suffixes_by_len = {}  -- length -> set of suffixes of that length

    -- Register a prefix/suffix fragment in the bucket for its length.
    local function remember(buckets, fragment)
        local bucket = buckets[#fragment]
        if bucket == nil then
            bucket = {}
            buckets[#fragment] = bucket
        end
        bucket[fragment] = true
    end

    if data.keys ~= nil then
        for _, pattern in pairs(data.keys) do
            if pattern:sub(1, 1) == '*' then
                if #pattern > 1 then
                    remember(suffixes_by_len, pattern:sub(2))
                end
            elseif pattern:sub(-1) == '*' then
                remember(prefixes_by_len, pattern:sub(1, -2))
            else
                exact[pattern] = true
            end
        end
    end

    if data.tags ~= nil then
        for key, values in pairs(data.tags) do
            if exact[key] == nil then
                local accepted = {}
                for _, value in pairs(values) do
                    accepted[value] = true
                end
                exact[key] = accepted
            end
        end
    end

    return function (k, v)
        local hit = exact[k]
        if hit == true or (hit ~= nil and hit[v] ~= nil) then
            return true
        end

        for len, fragments in pairs(suffixes_by_len) do
            if #k >= len and fragments[k:sub(-len)] ~= nil then
                return true
            end
        end

        for len, fragments in pairs(prefixes_by_len) do
            if #k >= len and fragments[k:sub(1, len)] ~= nil then
                return true
            end
        end

        return false
    end
end
|
|
|
|
|
|
-- Build a classifier function that assigns tags to named groups.
--   data - table mapping a group name to a list of key patterns: 'key'
--          (exact), 'prefix*' or '*suffix'. A lone '*' is ignored.
--
-- Returns nil when `data` is nil or an empty table. Otherwise returns a
-- function(k, v) yielding the group of the tag. Exact keys are tried first,
-- then suffixes, then prefixes; the function returns nothing when no
-- pattern applies.
function module.tag_group(data)
    if data == nil or next(data) == nil then
        return nil
    end

    local exact = {}            -- key -> group
    local prefixes_by_len = {}  -- length -> (prefix -> group)
    local suffixes_by_len = {}  -- length -> (suffix -> group)

    -- Register a prefix/suffix fragment in the bucket for its length.
    local function remember(buckets, fragment, group)
        local bucket = buckets[#fragment]
        if bucket == nil then
            bucket = {}
            buckets[#fragment] = bucket
        end
        bucket[fragment] = group
    end

    for group, patterns in pairs(data) do
        for _, pattern in pairs(patterns) do
            if pattern:sub(1, 1) == '*' then
                if #pattern > 1 then
                    remember(suffixes_by_len, pattern:sub(2), group)
                end
            elseif pattern:sub(-1) == '*' then
                remember(prefixes_by_len, pattern:sub(1, -2), group)
            else
                exact[pattern] = group
            end
        end
    end

    return function (k, v)
        local group = exact[k]
        if group ~= nil then
            return group
        end

        for len, fragments in pairs(suffixes_by_len) do
            if #k >= len then
                group = fragments[k:sub(-len)]
                if group ~= nil then
                    return group
                end
            end
        end

        for len, fragments in pairs(prefixes_by_len) do
            if #k >= len then
                group = fragments[k:sub(1, len)]
                if group ~= nil then
                    return group
                end
            end
        end
        -- No pattern applies: fall off the end without a return value.
    end
end
|
|
|
|
-- Convert a key pattern into the key recorded in the TAGINFO_* tables.
--   '*suffix' patterns are rejected (nil is returned)
--   'prefix*' patterns lose the trailing '*' together with the character
--             in front of it, e.g. 'name:*' becomes 'name'
--   any other key is returned unchanged
-- NOTE(review): a pattern without separator such as 'name*' also loses its
-- last letter - confirm that prefix patterns always end in ':*'.
local function process_key(key)
    local is_suffix_pattern = key:sub(1, 1) == '*'
    if is_suffix_pattern then
        return nil
    end

    if key:sub(-1) ~= '*' then
        return key
    end

    return key:sub(1, -3)
end
|
|
|
|
-- Process functions for all data types
|
|
-- Process an OSM node: its geometry is the point returned by as_point().
--   object - the node as handed over by osm2pgsql
function module.process_node(object)
    local place = Place.new(object, function (o)
        return o:as_point()
    end)

    module.process_tags(place)
end
|
|
|
|
-- Process an OSM way. The geometry is the polygon built from the way; when
-- that polygon is null, the way is used as a linestring instead.
--   object - the way as handed over by osm2pgsql
function module.process_way(object)
    local function polygon_or_line(o)
        local area = o:as_polygon()
        if not area:is_null() then
            return area
        end

        local line = o:as_linestring()
        return line
    end

    module.process_tags(Place.new(object, polygon_or_line))
end
|
|
|
|
-- Process an OSM relation. The geometry function is looked up in
-- module.RELATION_TYPES by the relation's 'type' tag; relations whose type
-- has no entry there are ignored.
--   object - the relation as handed over by osm2pgsql
function module.process_relation(object)
    local geom_func = module.RELATION_TYPES[object.tags.type]
    if geom_func == nil then
        return
    end

    module.process_tags(Place.new(object, geom_func))
end
|
|
|
|
-- Register the process functions of this module as the osm2pgsql callbacks
-- for nodes, ways and relations, so that they are used by default.
osm2pgsql.process_node = module.process_node
osm2pgsql.process_way = module.process_way
osm2pgsql.process_relation = module.process_relation
|
|
|
|
-- Sort the tags of a place into names, address parts and main tags and
-- write the resulting rows.
--   o - a Place object
--
-- Steps, in order:
--   1. apply the pre-filters (PRE_DELETE, PRE_EXTRAS)
--   2. for administrative boundaries, move a 'place' tag into the extratags
--      unless its value starts with 'isl'
--   3. collect names and address parts; either may produce a fallback
--      main tag
--   4. objects with an interpolation address are written as place=houses
--      and processing stops
--   5. apply POST_DELETE and write one row per main tag found in MAIN_KEYS
--   6. when no row was written, write the fallback (if there is one)
function module.process_tags(o)
    local tags = o.object.tags

    o:clean{delete = PRE_DELETE, extra = PRE_EXTRAS}

    -- Exception for boundary/place double tagging
    if tags.boundary == 'administrative' then
        o:grab_extratags{match = function (k, v)
            return k == 'place' and v:sub(1, 3) ~= 'isl'
        end}
    end

    -- name keys
    local fallback = o:grab_name_parts{groups = NAMES}

    -- address keys
    local main_addresses = o:grab_address_parts{groups = ADDRESS_TAGS}
    if main_addresses > 0 and fallback == nil then
        fallback = {'place', 'house', 'always'}
    end

    -- A country entry is only kept when it is exactly two characters long.
    local country = o.address.country
    if country ~= nil and #country ~= 2 then
        o.address['country'] = nil
    end

    if POSTCODE_FALLBACK and fallback == nil and o.address.postcode ~= nil then
        fallback = {'place', 'postcode', 'always'}
    end

    if o.address.interpolation ~= nil then
        o:write_place('place', 'houses', 'always', SAVE_EXTRA_MAINS)
        return
    end

    o:clean{delete = POST_DELETE}

    -- collect main keys
    for k, v in pairs(tags) do
        local ktype = MAIN_KEYS[k]
        if ktype == 'fallback' then
            -- Only remembered, written later if nothing else matched.
            if o.has_name then
                fallback = {k, v, 'named'}
            end
        elseif ktype ~= nil then
            o:write_place(k, v, ktype, SAVE_EXTRA_MAINS)
        end
    end

    if fallback ~= nil and o.num_entries == 0 then
        o:write_place(fallback[1], fallback[2], fallback[3], SAVE_EXTRA_MAINS)
    end
end
|
|
|
|
--------- Convenience functions for simple style configuration -----------------
|
|
|
|
|
|
-- Configure the filters that run before any other tag processing.
--   data.delete_keys / data.delete_tags - tags to drop (see tag_match)
--   data.extra_keys / data.extra_tags   - tags to move into the extratags
-- data.delete_tags is also published in module.TAGINFO_MAIN.delete_tags.
function module.set_prefilters(data)
    local delete_tags = data.delete_tags

    PRE_DELETE = module.tag_match({keys = data.delete_keys, tags = delete_tags})
    PRE_EXTRAS = module.tag_match({keys = data.extra_keys, tags = data.extra_tags})

    module.TAGINFO_MAIN.delete_tags = delete_tags
end
|
|
|
|
-- Configure the main tags.
--   data - table mapping a tag key to its main-tag type (as understood by
--          Place:write_place, or 'fallback')
-- The list of keys is also published in module.TAGINFO_MAIN.keys.
function module.set_main_tags(data)
    MAIN_KEYS = data

    local key_list = {}
    for key in pairs(data) do
        key_list[#key_list + 1] = key
    end

    module.TAGINFO_MAIN.keys = key_list
end
|
|
|
|
-- Configure the name tags.
--   data - table mapping a name group to a list of key patterns (see
--          tag_group)
-- Every pattern accepted by process_key() is also recorded in
-- module.TAGINFO_NAME_KEYS.
function module.set_name_tags(data)
    NAMES = module.tag_group(data)

    for _, patterns in pairs(data) do
        for _, pattern in ipairs(patterns) do
            local taginfo_key = process_key(pattern)
            if taginfo_key ~= nil then
                module.TAGINFO_NAME_KEYS[taginfo_key] = true
            end
        end
    end
end
|
|
|
|
-- Configure the address tags.
--   data - table mapping an address group to a list of key patterns (see
--          tag_group). The optional entry 'postcode_fallback' overrides
--          POSTCODE_FALLBACK; it is removed from `data` (the caller's table
--          is modified) before the groups are evaluated.
-- Every pattern accepted by process_key() is also recorded in
-- module.TAGINFO_ADDRESS_KEYS.
function module.set_address_tags(data)
    local use_postcodes = data.postcode_fallback
    if use_postcodes ~= nil then
        POSTCODE_FALLBACK = use_postcodes
        data.postcode_fallback = nil
    end

    ADDRESS_TAGS = module.tag_group(data)

    -- pairs() never yields nil values, so every entry can be used directly.
    for _, patterns in pairs(data) do
        for _, pattern in ipairs(patterns) do
            local taginfo_key = process_key(pattern)
            if taginfo_key ~= nil then
                module.TAGINFO_ADDRESS_KEYS[taginfo_key] = true
            end
        end
    end
end
|
|
|
|
-- Configure what happens to tags that were not used otherwise.
--   data.extra_keys / data.extra_tags   - only matching tags are saved as
--                                         extratags, nothing is deleted
--   data.delete_keys / data.delete_tags - matching tags are deleted, all
--                                         other tags are saved as extratags
-- Giving options of both kinds raises an error. With no option at all the
-- delete variant is used.
function module.set_unused_handling(data)
    local wants_extra = data.extra_keys ~= nil or data.extra_tags ~= nil
    local wants_delete = data.delete_keys ~= nil or data.delete_tags ~= nil

    if wants_extra and wants_delete then
        error("unused handler can have only 'extra_keys' or 'delete_keys' set.")
    end

    if wants_extra then
        POST_DELETE = nil
        SAVE_EXTRA_MAINS = module.tag_match{keys = data.extra_keys, tags = data.extra_tags}
    else
        POST_DELETE = module.tag_match{keys = data.delete_keys, tags = data.delete_tags}
        SAVE_EXTRA_MAINS = function() return true end
    end
end
|
|
|
|
-- Replace the relation types that are processed.
--   data - table mapping the value of a relation's 'type' tag to the kind
--          of geometry to build: 'multipolygon' or 'multiline'. Entries
--          with any other value are ignored.
-- The previous content of module.RELATION_TYPES is discarded.
function module.set_relation_types(data)
    module.RELATION_TYPES = {}

    -- A generic `for` needs an iterator function; a bare table here fails
    -- with "attempt to call a table value", hence pairs().
    for k, v in pairs(data) do
        if v == 'multipolygon' then
            module.RELATION_TYPES[k] = module.relation_as_multipolygon
        elseif v == 'multiline' then
            module.RELATION_TYPES[k] = module.relation_as_multiline
        end
    end
end
|
|
|
|
return module
|