2010-12-13 18:55:52 +03:00
|
|
|
#!/usr/bin/php -Cq
|
|
|
|
<?php
|
|
|
|
|
2016-09-04 04:19:48 +03:00
|
|
|
// Bootstrap: pull in the settings file that lives one directory above this
// script, then the command-line initialisation library.
// NOTE(review): CONST_BasePath is presumably defined by settings.php, which
// is why the order of the two requires matters - confirm.
require_once dirname(__DIR__).'/settings/settings.php';
require_once CONST_BasePath.'/lib/init-cmd.php';

// Runtime configuration for this run: raise the memory ceiling and route
// PHP diagnostics to stderr so they do not mix with the script's stdout.
ini_set('memory_limit', '800M');
ini_set('display_errors', 'stderr');
|
|
|
|
|
2016-09-10 22:10:52 +03:00
|
|
|
// Command-line interface of the script. The first entry is the description
// text; every following row describes one option (long name, short name,
// further columns in the layout getCmdOpt() expects, and the help text).
// NOTE(review): the meaning of the numeric columns is defined by getCmdOpt(),
// which is not visible here.
$aCMDOptions = array(
    'Import and export special phrases',
    array('help', 'h', 0, 1, 0, 0, false, 'Show Help'),
    array('quiet', 'q', 0, 1, 0, 0, 'bool', 'Quiet output'),
    array('verbose', 'v', 0, 1, 0, 0, 'bool', 'Verbose output'),
    array('wiki-import', '', 0, 1, 0, 0, 'bool', 'Create import script for search phrases '),
);

// Parse the process arguments; the parsed values are read back from
// $aCMDResult further down (e.g. $aCMDResult['wiki-import']).
getCmdOpt($_SERVER['argv'], $aCMDOptions, $aCMDResult, true, true);

// Installation-specific phrase settings.
// NOTE(review): presumably this is where $aTagsBlacklist / $aTagsWhitelist
// come from; both are only used behind isset() guards later on - confirm.
include CONST_InstallPath.'/settings/phrase_settings.php';
|
2016-09-04 04:19:48 +03:00
|
|
|
|
2016-09-08 04:16:22 +03:00
|
|
|
// --wiki-import: download the special-phrase tables from the OSM wiki for
// every configured language and print an SQL script on stdout that
//   1. registers each phrase via getorcreate_amenity[operator](), and
//   2. creates one place_classtype_<class>_<type> lookup table (plus its
//      indexes and grant) for every distinct class/type pair encountered.
// Diagnostics go to stderr so that stdout stays pure SQL.
if ($aCMDResult['wiki-import']) {
    // createFromRules() returns null when the rules cannot be compiled; in
    // that case phrases are written with an empty normalized form.
    $oNormalizer = Transliterator::createFromRules(CONST_Term_Normalization_Rules);

    // Distinct class/type pairs, keyed by "class|type" to de-duplicate.
    $aPairs = array();

    // Configured language list, or the built-in default set.
    $sLanguageIn = CONST_Languages ? CONST_Languages :
        ('af,ar,br,ca,cs,de,en,es,et,eu,fa,fi,fr,gl,hr,hu,'.
         'ia,is,it,ja,mk,nl,no,pl,ps,pt,ru,sk,sl,sv,uk,vi');

    foreach (explode(',', $sLanguageIn) as $sLanguage) {
        $sURL = 'https://wiki.openstreetmap.org/wiki/Special:Export/Nominatim/Special_Phrases/'.strtoupper($sLanguage);
        $sWikiPageXML = file_get_contents($sURL);

        // A failed download yields false. Report it explicitly and move on
        // to the next language (the language was skipped before as well,
        // but without any message naming it).
        if ($sWikiPageXML === false) {
            fwrite(STDERR, "Could not download special phrases for language $sLanguage from $sURL\n");
            continue;
        }

        // One match per wiki table row: label || class || type || operator || plural flag.
        if (!preg_match_all('#\\| ([^|]+) \\|\\| ([^|]+) \\|\\| ([^|]+) \\|\\| ([^|]+) \\|\\| ([\\-YN])#', $sWikiPageXML, $aMatches, PREG_SET_ORDER)) {
            continue;
        }

        foreach ($aMatches as $aMatch) {
            $sLabel = trim($aMatch[1]);
            // NOTE(review): pg_escape_string() is called without a connection
            // handle throughout this script; PHP 8.1+ deprecates that form -
            // confirm the targeted PHP version.
            $sTrans = ($oNormalizer !== null)
                ? pg_escape_string($oNormalizer->transliterate($sLabel))
                : null;
            $sClass = trim($aMatch[2]);
            // hack around a bug where building=yes was imported with
            // quotes into the wiki
            $sType = preg_replace('/"/', '', trim($aMatch[3]));

            // sanity check, in case somebody added garbage in the wiki;
            // class and type are interpolated unescaped into the SQL below,
            // so anything but word characters must abort the run.
            if (preg_match('/^\\w+$/', $sClass) < 1
                || preg_match('/^\\w+$/', $sType) < 1
            ) {
                trigger_error("Bad class/type for language $sLanguage: $sClass=$sType");
                // Non-zero status so callers can tell the script was aborted.
                exit(1);
            }

            // blacklisting: disallow certain class/type combinations
            if (isset($aTagsBlacklist[$sClass]) && in_array($sType, $aTagsBlacklist[$sClass], true)) {
                continue;
            }

            // whitelisting: if class is in whitelist, allow only tags in the list
            if (isset($aTagsWhitelist[$sClass]) && !in_array($sType, $aTagsWhitelist[$sClass], true)) {
                continue;
            }

            $aPairs[$sClass.'|'.$sType] = array($sClass, $sType);

            $sOperator = trim($aMatch[4]);
            $sEscapedLabel = pg_escape_string($sLabel);
            if ($sOperator === 'near' || $sOperator === 'in') {
                // Phrases carrying a search operator.
                echo "select getorcreate_amenityoperator(make_standard_name('".$sEscapedLabel."'), '$sTrans', '$sClass', '$sType', '$sOperator');\n";
            } else {
                // Any other operator column value: plain phrase.
                echo "select getorcreate_amenity(make_standard_name('".$sEscapedLabel."'), '$sTrans', '$sClass', '$sType');\n";
            }
        }
    }

    // Temporary index on placex, dropped again at the end of the script.
    echo 'create index idx_placex_classtype on placex (class, type);';

    foreach ($aPairs as $aPair) {
        $sEscapedClass = pg_escape_string($aPair[0]);
        $sEscapedType = pg_escape_string($aPair[1]);
        $sTable = 'place_classtype_'.$sEscapedClass.'_'.$sEscapedType;

        // Lookup table holding place id and centroid of every matching place.
        echo 'create table '.$sTable;
        if (CONST_Tablespace_Aux_Data) {
            echo ' tablespace '.CONST_Tablespace_Aux_Data;
        }
        echo ' as select place_id as place_id,st_centroid(geometry) as centroid from placex where ';
        echo "class = '".$sEscapedClass."' and type = '".$sEscapedType."'";
        echo ";\n";

        // Spatial index on the centroid column.
        echo 'CREATE INDEX idx_'.$sTable.'_centroid ';
        echo 'ON '.$sTable.' USING GIST (centroid)';
        if (CONST_Tablespace_Aux_Index) {
            echo ' tablespace '.CONST_Tablespace_Aux_Index;
        }
        echo ";\n";

        // Btree index on place_id.
        echo 'CREATE INDEX idx_'.$sTable.'_place_id ';
        echo 'ON '.$sTable.' USING btree(place_id)';
        if (CONST_Tablespace_Aux_Index) {
            echo ' tablespace '.CONST_Tablespace_Aux_Index;
        }
        echo ";\n";

        // Read access for the web user.
        echo 'GRANT SELECT ON '.$sTable.' TO "'.CONST_Database_Web_User."\";\n";
    }

    echo 'drop index idx_placex_classtype;';
}
|