#!/usr/bin/php -Cq
<?php
// Command line tool that creates and populates a Nominatim database.
// Each step further down is selected through a command line switch.

// Load the installation settings and the shared command line helpers.
require_once(dirname(dirname(__FILE__)) . '/settings/settings.php');
require_once(CONST_BasePath . '/lib/init-cmd.php');

// Raise PHP's memory limit for this script.
ini_set('memory_limit', '800M');
// Option table passed to getCmdOpt() and showUsage(). The first entry is the
// program description; each following entry describes one switch and
// apparently holds the long name, the short name, four numeric flags, the
// value type and the help text.
// NOTE(review): the exact meaning of the numeric columns is defined by
// getCmdOpt(), which is not visible in this file - confirm there.
$aCMDOptions = array(
    " Create and setup nominatim search system ",

    // general switches
    array('help', 'h', 0, 1, 0, 0, false, 'Show Help'),
    array('quiet', 'q', 0, 1, 0, 0, 'bool', 'Quiet output'),
    array('verbose', 'v', 0, 1, 0, 0, 'bool', 'Verbose output'),

    // input file and resources
    array('osm-file', '', 0, 1, 1, 1, 'realpath', 'File to import'),
    array('threads', '', 0, 1, 1, 1, 'int', 'Number of threads (where possible)'),

    // individual setup steps and their modifiers
    array('all', '', 0, 1, 0, 0, 'bool', 'Do the complete process'),
    array('create-db', '', 0, 1, 0, 0, 'bool', 'Create nominatim db'),
    array('setup-db', '', 0, 1, 0, 0, 'bool', 'Build a blank nominatim db'),
    array('import-data', '', 0, 1, 0, 0, 'bool', 'Import a osm file'),
    array('osm2pgsql-cache', '', 0, 1, 1, 1, 'int', 'Cache size used by osm2pgsql'),
    array('create-functions', '', 0, 1, 0, 0, 'bool', 'Create functions'),
    array('enable-diff-updates', '', 0, 1, 0, 0, 'bool', 'Turn on the code required to make diff updates work'),
    array('enable-debug-statements', '', 0, 1, 0, 0, 'bool', 'Include debug warning statements in pgsql commands'),
    array('ignore-errors', '', 0, 1, 0, 0, 'bool', 'Continue import even when errors in SQL are present (EXPERT)'),
    array('create-tables', '', 0, 1, 0, 0, 'bool', 'Create main tables'),
    array('create-partition-tables', '', 0, 1, 0, 0, 'bool', 'Create required partition tables'),
    array('create-partition-functions', '', 0, 1, 0, 0, 'bool', 'Create required partition triggers'),
    array('no-partitions', '', 0, 1, 0, 0, 'bool', " Do not partition search indices (speeds up import of single country extracts) "),
    array('import-wikipedia-articles', '', 0, 1, 0, 0, 'bool', 'Import wikipedia article dump'),
    array('load-data', '', 0, 1, 0, 0, 'bool', 'Copy data to live tables from import table'),
    array('disable-token-precalc', '', 0, 1, 0, 0, 'bool', 'Disable name precalculation (EXPERT)'),
    array('import-tiger-data', '', 0, 1, 0, 0, 'bool', 'Import tiger data (not included in \'all\')'),
    array('calculate-postcodes', '', 0, 1, 0, 0, 'bool', 'Calculate postcode centroids'),
    array('osmosis-init', '', 0, 1, 0, 0, 'bool', 'Generate default osmosis configuration'),
    array('index', '', 0, 1, 0, 0, 'bool', 'Index the data'),
    array('index-noanalyse', '', 0, 1, 0, 0, 'bool', 'Do not perform analyse operations during index (EXPERT)'),
    array('create-search-indices', '', 0, 1, 0, 0, 'bool', 'Create additional indices required for search and update'),
    array('create-country-names', '', 0, 1, 0, 0, 'bool', 'Create default list of searchable country names'),
    array('drop', '', 0, 1, 0, 0, 'bool', 'Drop tables needed for updates, making the database readonly (EXPERIMENTAL)'),
);
// Parse the command line into $aCMDResult according to the option table.
getCmdOpt($_SERVER['argv'], $aCMDOptions, $aCMDResult, true, true);

// Set to true by every step that runs; used at the end to decide whether
// the usage text has to be shown.
$bDidSomething = false;

// Check if osm-file is set and points to a valid file if --all or --import-data is given
$bNeedsOsmFile = $aCMDResult['import-data'] || $aCMDResult['all'];
if ($bNeedsOsmFile) {
    if (!isset($aCMDResult['osm-file'])) {
        fail('missing --osm-file for data import');
    }

    if (!file_exists($aCMDResult['osm-file'])) {
        fail('the path supplied to --osm-file does not exist');
    }

    if (!is_readable($aCMDResult['osm-file'])) {
        fail('osm-file "' . $aCMDResult['osm-file'] . '" not readable');
    }
}
// This is a pretty hard core default - the number of processors in the box - 1
if (isset($aCMDResult['threads'])) {
    $iInstances = $aCMDResult['threads'];
} else {
    $iInstances = getProcessorCount() - 1;
}

// Clamp the thread count to the range 1 .. number of processors.
if ($iInstances < 1) {
    $iInstances = 1;
    echo " WARNING: resetting threads to $iInstances\n ";
}
if ($iInstances > getProcessorCount()) {
    $iInstances = getProcessorCount();
    echo " WARNING: resetting threads to $iInstances\n ";
}

// Assume we can steal all the cache memory in the box (unless told otherwise)
$iCacheMemory = isset($aCMDResult['osm2pgsql-cache'])
    ? $aCMDResult['osm2pgsql-cache']
    : getCacheMemoryMB();

// Split the configured DSN into its parts; fall back to port 5432 when the
// DSN carries no (or an empty) port.
$aDSNInfo = DB::parseDSN(CONST_Database_DSN);
if (empty($aDSNInfo['port'])) {
    $aDSNInfo['port'] = 5432;
}
// Step --create-db: create the database named in the DSN.
if ($aCMDResult['create-db'] || $aCMDResult['all']) {
    echo " Create DB \n ";
    $bDidSomething = true;

    // A successful connection means the database is already there.
    $oDB = DB::connect(CONST_Database_DSN, false);
    $bConnectFailed = PEAR::isError($oDB);
    if (!$bConnectFailed) {
        fail('database already exists (' . CONST_Database_DSN . ')');
    }

    $sCreateDbCmd = 'createdb -E UTF-8 -p ' . $aDSNInfo['port'] . ' ' . $aDSNInfo['database'];
    passthruCheckReturn($sCreateDbCmd);
}
// Step --setup-db: check the server versions, install the required
// extensions and load the static country and postcode data.
if ($aCMDResult['setup-db'] || $aCMDResult['all']) {
    echo " Setup DB \n ";
    $bDidSomething = true;

    // TODO: path detection, detection memory, etc.
    //
    $oDB =& getDB();

    $fPostgresVersion = getPostgresVersion($oDB);
    echo 'Postgres version found: ' . $fPostgresVersion . " \n ";

    if ($fPostgresVersion < 9.1) {
        fail(" Minimum supported version of Postgresql is 9.1. ");
    }

    pgsqlRunScript('CREATE EXTENSION IF NOT EXISTS hstore');
    pgsqlRunScript('CREATE EXTENSION IF NOT EXISTS postgis');

    // For extratags and namedetails the hstore_to_json converter is
    // needed which is only available from Postgresql 9.3+. For older
    // versions add a dummy function that returns nothing.
    $iNumFunc = chksql($oDB->getOne(" select count(*) from pg_proc where proname = 'hstore_to_json' "));

    if ($iNumFunc == 0) {
        pgsqlRunScript(" create function hstore_to_json(dummy hstore) returns text AS 'select null::text' language sql immutable ");
        // Terminate the line so the next status message starts on its own line.
        echo " WARNING: Postgresql is too old. extratags and namedetails API not available. \n";
    }

    $fPostgisVersion = getPostgisVersion($oDB);
    echo 'Postgis version found: ' . $fPostgisVersion . " \n ";

    if ($fPostgisVersion < 2.1) {
        // Functions were renamed in 2.1 and throw an annoying deprecation warning
        pgsqlRunScript('ALTER FUNCTION st_line_interpolate_point(geometry, double precision) RENAME TO ST_LineInterpolatePoint');
        pgsqlRunScript('ALTER FUNCTION ST_Line_Locate_Point(geometry, geometry) RENAME TO ST_LineLocatePoint');
    }
    if ($fPostgisVersion < 2.2) {
        pgsqlRunScript('ALTER FUNCTION ST_Distance_Spheroid(geometry, geometry, spheroid) RENAME TO ST_DistanceSpheroid');
    }

    // The country grid has to be downloaded separately. Use one path for
    // the existence check, the download hint and the import, so that a
    // custom CONST_ExtraDataPath works.
    $sCountryGridFile = CONST_ExtraDataPath . '/country_osm_grid.sql.gz';
    if (!file_exists($sCountryGridFile)) {
        echo " Error: you need to download the country_osm_grid first: ";
        echo "\n    wget -O " . $sCountryGridFile . " http://www.nominatim.org/data/country_grid.sql.gz\n";
        exit(1);
    }

    pgsqlRunScriptFile(CONST_BasePath . '/data/country_name.sql');
    pgsqlRunScriptFile(CONST_BasePath . '/data/country_naturalearthdata.sql');
    pgsqlRunScriptFile($sCountryGridFile);
    pgsqlRunScriptFile(CONST_BasePath . '/data/gb_postcode_table.sql');

    // The UK postcode data is optional.
    if (file_exists(CONST_BasePath . '/data/gb_postcode_data.sql.gz')) {
        pgsqlRunScriptFile(CONST_BasePath . '/data/gb_postcode_data.sql.gz');
    } else {
        echo " WARNING: external UK postcode table not found. \n ";
    }

    if (CONST_Use_Extra_US_Postcodes) {
        pgsqlRunScriptFile(CONST_BasePath . '/data/us_postcode.sql');
    }

    // Without partitioning every country goes into partition 0.
    if ($aCMDResult['no-partitions']) {
        pgsqlRunScript('update country_name set partition = 0');
    }

    // the following will be needed by create_functions later but
    // is only defined in the subsequently called create_tables.
    // Create dummies here that will be overwritten by the proper
    // versions in create-tables.
    pgsqlRunScript('CREATE TABLE place_boundingbox ()');
    pgsqlRunScript('create type wikipedia_article_match as ()');
}
// Step --import-data: run osm2pgsql with the gazetteer output on the
// given OSM file and verify that the place table received data.
if ($aCMDResult['import-data'] || $aCMDResult['all']) {
    echo " Import \n ";
    $bDidSomething = true;

    $osm2pgsql = CONST_Osm2pgsql_Binary;
    if (!file_exists($osm2pgsql)) {
        echo " Check CONST_Osm2pgsql_Binary in your local settings file. \n ";
        echo " Normally you should not need to set this manually. \n ";
        fail(" osm2pgsql not found in ' $osm2pgsql ' ");
    }

    // File paths are shell-escaped so that paths containing spaces or
    // other shell metacharacters are passed through as a single argument.
    if (!is_null(CONST_Osm2pgsql_Flatnode_File)) {
        $osm2pgsql .= ' --flat-nodes ' . escapeshellarg(CONST_Osm2pgsql_Flatnode_File);
    }

    // Optional tablespaces for the osm2pgsql tables.
    if (CONST_Tablespace_Osm2pgsql_Data) {
        $osm2pgsql .= ' --tablespace-slim-data ' . CONST_Tablespace_Osm2pgsql_Data;
    }
    if (CONST_Tablespace_Osm2pgsql_Index) {
        $osm2pgsql .= ' --tablespace-slim-index ' . CONST_Tablespace_Osm2pgsql_Index;
    }
    if (CONST_Tablespace_Place_Data) {
        $osm2pgsql .= ' --tablespace-main-data ' . CONST_Tablespace_Place_Data;
    }
    if (CONST_Tablespace_Place_Index) {
        $osm2pgsql .= ' --tablespace-main-index ' . CONST_Tablespace_Place_Index;
    }

    $osm2pgsql .= ' -lsc -O gazetteer --hstore --number-processes 1';
    $osm2pgsql .= ' -C ' . $iCacheMemory;
    $osm2pgsql .= ' -P ' . $aDSNInfo['port'];
    $osm2pgsql .= ' -d ' . $aDSNInfo['database'] . ' ' . escapeshellarg($aCMDResult['osm-file']);
    passthruCheckReturn($osm2pgsql);

    // An empty place table means the import produced nothing usable.
    $oDB =& getDB();
    if (!$aCMDResult['ignore-errors'] && !chksql($oDB->getRow('select * from place limit 1'))) {
        fail('No Data');
    }
}
// Step --create-functions: install the SQL functions. They depend on the
// compiled nominatim module, so refuse to continue without it.
if ($aCMDResult['create-functions'] || $aCMDResult['all']) {
    echo " Functions \n ";
    $bDidSomething = true;

    $sModuleFile = CONST_InstallPath . '/module/nominatim.so';
    if (!file_exists($sModuleFile)) {
        fail(" nominatim module not built ");
    }

    create_sql_functions($aCMDResult);
}
// Step --create-tables: instantiate sql/tables.sql for this installation
// and run it, then install the SQL functions again.
if ($aCMDResult['create-tables'] || $aCMDResult['all']) {
    $bDidSomething = true;
    echo " Tables \n ";

    $sTemplate = file_get_contents(CONST_BasePath . '/sql/tables.sql');
    $sTemplate = str_replace('{www-user}', CONST_Database_Web_User, $sTemplate);

    // Placeholder => configured tablespace, substituted in this order.
    $aTablesTablespaces = array(
        '{ts:address-data}' => CONST_Tablespace_Address_Data,
        '{ts:address-index}' => CONST_Tablespace_Address_Index,
        '{ts:search-data}' => CONST_Tablespace_Search_Data,
        '{ts:search-index}' => CONST_Tablespace_Search_Index,
        '{ts:aux-data}' => CONST_Tablespace_Aux_Data,
        '{ts:aux-index}' => CONST_Tablespace_Aux_Index
    );
    foreach ($aTablesTablespaces as $sTsPlaceholder => $sTsName) {
        $sTemplate = replace_tablespace($sTsPlaceholder, $sTsName, $sTemplate);
    }

    // Errors in the table script are not fatal.
    pgsqlRunScript($sTemplate, false);

    // re-run the functions
    echo " Functions \n ";
    create_sql_functions($aCMDResult);
}
// Step --create-partition-tables: expand sql/partition-tables.src.sql for
// every partition and run it.
if ($aCMDResult['create-partition-tables'] || $aCMDResult['all']) {
    echo " Partition Tables \n ";
    $bDidSomething = true;

    $sTemplate = file_get_contents(CONST_BasePath . '/sql/partition-tables.src.sql');

    // Placeholder => configured tablespace, substituted in this order.
    $aPartitionTablespaces = array(
        '{ts:address-data}' => CONST_Tablespace_Address_Data,
        '{ts:address-index}' => CONST_Tablespace_Address_Index,
        '{ts:search-data}' => CONST_Tablespace_Search_Data,
        '{ts:search-index}' => CONST_Tablespace_Search_Index,
        '{ts:aux-data}' => CONST_Tablespace_Aux_Data,
        '{ts:aux-index}' => CONST_Tablespace_Aux_Index
    );
    foreach ($aPartitionTablespaces as $sTsPlaceholder => $sTsName) {
        $sTemplate = replace_tablespace($sTsPlaceholder, $sTsName, $sTemplate);
    }

    pgsqlRunPartitionScript($sTemplate);
}
// Step --create-partition-functions: expand and run
// sql/partition-functions.src.sql for every partition.
if ($aCMDResult['create-partition-functions'] || $aCMDResult['all']) {
    echo " Partition Functions \n ";
    $bDidSomething = true;

    pgsqlRunPartitionScript(
        file_get_contents(CONST_BasePath . '/sql/partition-functions.src.sql')
    );
}
// Step --import-wikipedia-articles: restore the optional wikipedia dumps.
// A missing dump only produces a warning.
if ($aCMDResult['import-wikipedia-articles'] || $aCMDResult['all']) {
    $bDidSomething = true;

    // One entry per dump: file, progress message, warning when missing.
    $aWikiDumps = array(
        array(
            CONST_Wikipedia_Data_Path . '/wikipedia_article.sql.bin',
            " Importing wikipedia articles... ",
            " WARNING: wikipedia article dump file not found - places will have default importance \n "
        ),
        array(
            CONST_Wikipedia_Data_Path . '/wikipedia_redirect.sql.bin',
            " Importing wikipedia redirects... ",
            " WARNING: wikipedia redirect dump file not found - some place importance values may be missing \n "
        )
    );
    $sWikiArticlesFile = $aWikiDumps[0][0];
    $sWikiRedirectsFile = $aWikiDumps[1][0];

    foreach ($aWikiDumps as $aWikiDump) {
        if (!file_exists($aWikiDump[0])) {
            echo $aWikiDump[2];
            continue;
        }
        echo $aWikiDump[1];
        pgsqlRunDropAndRestore($aWikiDump[0]);
        echo " ...done \n ";
    }
}
// Step --load-data: empty the live tables and copy the imported rows from
// the place table into placex and location_property_osmline, using several
// database connections in parallel.
if ($aCMDResult['load-data'] || $aCMDResult['all']) {
    echo " Drop old Data \n ";
    $bDidSomething = true;

    $oDB =& getDB();

    // Statements that reset the live tables and the place id sequence.
    // They run in this order; any failure aborts the setup.
    $aResetStatements = array(
        'TRUNCATE word',
        'TRUNCATE placex',
        'TRUNCATE location_property_osmline',
        'TRUNCATE place_addressline',
        'TRUNCATE place_boundingbox',
        'TRUNCATE location_area',
        'TRUNCATE search_name',
        'TRUNCATE search_name_blank',
        'DROP SEQUENCE seq_place',
        'CREATE SEQUENCE seq_place start 100000'
    );
    foreach ($aResetStatements as $sResetStatement) {
        if (!pg_query($oDB->connection, $sResetStatement)) {
            fail(pg_last_error($oDB->connection));
        }
        echo '.';
    }

    // Empty the per-partition road tables. Partition 0 is added explicitly
    // unless partitioning is disabled.
    $sSQL = 'select distinct partition from country_name';
    $aPartitions = chksql($oDB->getCol($sSQL));
    if (!$aCMDResult['no-partitions']) {
        $aPartitions[] = 0;
    }
    foreach ($aPartitions as $sPartition) {
        if (!pg_query($oDB->connection, 'TRUNCATE location_road_' . $sPartition)) {
            fail(pg_last_error($oDB->connection));
        }
        echo '.';
    }

    // used by getorcreate_word_id to ignore frequent partial words
    $sSQL = 'CREATE OR REPLACE FUNCTION get_maxwordfreq() RETURNS integer AS ';
    $sSQL .= '$$ SELECT ' . CONST_Max_Word_Frequency . ' as maxwordfreq; $$ LANGUAGE SQL IMMUTABLE';
    if (!pg_query($oDB->connection, $sSQL)) {
        fail(pg_last_error($oDB->connection));
    }
    echo " . \n ";

    // pre-create the word list
    if (!$aCMDResult['disable-token-precalc']) {
        echo " Loading word list \n ";
        pgsqlRunScriptFile(CONST_BasePath . '/data/words.sql');
    }

    echo " Load Data \n ";
    $sColumns = 'osm_type, osm_id, class, type, name, admin_level, address, extratags, geometry';

    // Each load connection copies the rows whose osm_id falls into its
    // modulo class; the queries are sent asynchronously.
    $aDBInstances = array();
    $iLoadThreads = max(1, $iInstances - 1);
    for ($i = 0; $i < $iLoadThreads; $i++) {
        $aDBInstances[$i] =& getDB(true);
        $sSQL = " INSERT INTO placex ( $sColumns ) SELECT $sColumns FROM place WHERE osm_id % $iLoadThreads = $i ";
        $sSQL .= " and not (class='place' and type='houses' and osm_type='W' ";
        $sSQL .= " and ST_GeometryType(geometry) = 'ST_LineString') ";
        $sSQL .= " and ST_IsValid(geometry) ";
        if ($aCMDResult['verbose']) {
            echo " $sSQL\n ";
        }
        if (!pg_send_query($aDBInstances[$i]->connection, $sSQL)) {
            fail(pg_last_error($aDBInstances[$i]->connection));
        }
    }

    // last thread for interpolation lines
    $aDBInstances[$iLoadThreads] =& getDB(true);
    $sSQL = 'insert into location_property_osmline';
    $sSQL .= ' (osm_id, address, linegeo)';
    $sSQL .= ' SELECT osm_id, address, geometry from place where ';
    $sSQL .= " class='place' and type='houses' and osm_type='W' and ST_GeometryType(geometry) = 'ST_LineString' ";
    if ($aCMDResult['verbose']) {
        echo " $sSQL\n ";
    }
    if (!pg_send_query($aDBInstances[$iLoadThreads]->connection, $sSQL)) {
        fail(pg_last_error($aDBInstances[$iLoadThreads]->connection));
    }

    // Poll once per second until no connection is busy any more.
    $bAnyBusy = true;
    while ($bAnyBusy) {
        $bAnyBusy = false;
        for ($i = 0; $i <= $iLoadThreads; $i++) {
            if (pg_connection_busy($aDBInstances[$i]->connection)) {
                $bAnyBusy = true;
            }
        }
        sleep(1);
        echo '.';
    }
    echo " \n ";

    // pg_send_query() only reports whether the query could be sent. The
    // outcome has to be fetched explicitly, otherwise a failed INSERT
    // goes unnoticed and the setup continues with incomplete tables.
    $bLoadFailed = false;
    for ($i = 0; $i <= $iLoadThreads; $i++) {
        while (($hLoadResult = pg_get_result($aDBInstances[$i]->connection)) !== false) {
            $iLoadStatus = pg_result_status($hLoadResult);
            if ($iLoadStatus != PGSQL_COMMAND_OK && $iLoadStatus != PGSQL_TUPLES_OK) {
                echo 'SQL error on load connection ' . $i . ': ' . pg_result_error($hLoadResult) . "\n";
                $bLoadFailed = true;
            }
        }
    }
    if ($bLoadFailed && !$aCMDResult['ignore-errors']) {
        fail('SQL errors loading placex and/or location_property_osmline tables');
    }

    echo " Reanalysing database... \n ";
    pgsqlRunScript('ANALYSE');

    // Record the date of the imported data. Problems here are reported
    // but do not abort the setup.
    $sDatabaseDate = getDatabaseDate($oDB);
    if (!pg_query($oDB->connection, 'TRUNCATE import_status')) {
        echo 'WARNING: could not reset import_status: ' . pg_last_error($oDB->connection) . "\n";
    }
    if ($sDatabaseDate === false) {
        echo " WARNING: could not determine database date. \n ";
    } else {
        // Bind the date as a parameter instead of pasting it into the SQL.
        $sSQL = 'INSERT INTO import_status (lastimportdate) VALUES($1)';
        if (!pg_query_params($oDB->connection, $sSQL, array($sDatabaseDate))) {
            echo 'WARNING: could not store import date: ' . pg_last_error($oDB->connection) . "\n";
        }
        echo " Latest data imported from $sDatabaseDate . \n ";
    }
}
// Step --import-tiger-data: run every *.sql file found in
// CONST_Tiger_Data_Path line by line, distributing the lines over several
// database connections, then build the indexes.
if ($aCMDResult['import-tiger-data']) {
    $bDidSomething = true;

    $sTemplate = file_get_contents(CONST_BasePath . '/sql/tiger_import_start.sql');
    $sTemplate = str_replace('{www-user}', CONST_Database_Web_User, $sTemplate);
    $sTemplate = replace_tablespace('{ts:aux-data}', CONST_Tablespace_Aux_Data, $sTemplate);
    $sTemplate = replace_tablespace('{ts:aux-index}', CONST_Tablespace_Aux_Index, $sTemplate);
    pgsqlRunScript($sTemplate, false);

    // One connection per worker.
    $aDBInstances = array();
    for ($i = 0; $i < $iInstances; $i++) {
        $aDBInstances[$i] =& getDB(true);
    }

    // glob() returns false on error; treat that as "no files".
    $aTigerFiles = glob(CONST_Tiger_Data_Path . '/*.sql');
    if ($aTigerFiles === false) {
        $aTigerFiles = array();
    }

    foreach ($aTigerFiles as $sFile) {
        echo $sFile . ': ';
        $hFile = fopen($sFile, 'r');
        if ($hFile === false) {
            fail('unable to open ' . $sFile);
        }
        // NOTE(review): the line read here is never sent to the database,
        // because the loop below reads the next line before sending.
        // Kept as is - confirm whether skipping the first line is intended.
        $sSQL = fgets($hFile, 100000);
        $iLines = 0;

        while (true) {
            for ($i = 0; $i < $iInstances; $i++) {
                if (!pg_connection_busy($aDBInstances[$i]->connection)) {
                    // Drain pending results before reusing the connection.
                    while (pg_get_result($aDBInstances[$i]->connection));
                    $sSQL = fgets($hFile, 100000);
                    if (!$sSQL) {
                        break 2;
                    }
                    // Report the error of the connection the query was sent
                    // on; $oDB may not even be defined in this step.
                    if (!pg_send_query($aDBInstances[$i]->connection, $sSQL)) {
                        fail(pg_last_error($aDBInstances[$i]->connection));
                    }
                    $iLines++;
                    // Progress marker every 1000 lines.
                    if ($iLines == 1000) {
                        echo " . ";
                        $iLines = 0;
                    }
                }
            }
            usleep(10);
        }

        fclose($hFile);

        // Wait for all workers to finish before starting the next file.
        $bAnyBusy = true;
        while ($bAnyBusy) {
            $bAnyBusy = false;
            for ($i = 0; $i < $iInstances; $i++) {
                if (pg_connection_busy($aDBInstances[$i]->connection)) {
                    $bAnyBusy = true;
                }
            }
            usleep(10);
        }
        echo " \n ";
    }

    echo " Creating indexes \n ";
    $sTemplate = file_get_contents(CONST_BasePath . '/sql/tiger_import_finish.sql');
    $sTemplate = str_replace('{www-user}', CONST_Database_Web_User, $sTemplate);
    $sTemplate = replace_tablespace('{ts:aux-data}', CONST_Tablespace_Aux_Data, $sTemplate);
    $sTemplate = replace_tablespace('{ts:aux-index}', CONST_Tablespace_Aux_Index, $sTemplate);
    pgsqlRunScript($sTemplate, false);
}
// Step --calculate-postcodes: replace the artificial postcode places
// (osm_type 'P') in placex with freshly computed ones.
if ($aCMDResult['calculate-postcodes'] || $aCMDResult['all']) {
    $bDidSomething = true;
    $oDB =& getDB();

    // Remove the postcode places of a previous run.
    $sDeleteSQL = 'DELETE from placex where osm_type=\'P\'';
    if (!pg_query($oDB->connection, $sDeleteSQL)) {
        fail(pg_last_error($oDB->connection));
    }

    // One place per (country, postcode), located at the average centroid
    // of all places that carry this postcode in their address.
    $sSQL = " insert into placex (osm_type,osm_id,class,type,address,country_code,geometry) "
        . " select 'P',nextval('seq_postcodes'),'place','postcode', "
        . " hstore('postcode', pc),country_code, "
        . " ST_SetSRID(ST_Point(x,y),4326) as geometry from (select country_code, "
        . " address->'postcode' as pc, "
        . " avg(st_x(st_centroid(geometry))) as x,avg(st_y(st_centroid(geometry))) as y "
        . " from placex where address ? 'postcode' group by country_code,pc) as x "
        . " where ST_Point(x,y) is not null ";
    if (!pg_query($oDB->connection, $sSQL)) {
        fail(pg_last_error($oDB->connection));
    }

    // Optionally add the postcodes from the us_postcode table.
    if (CONST_Use_Extra_US_Postcodes) {
        $sSQL = " insert into placex (osm_type,osm_id,class,type,address,country_code,geometry) "
            . " select 'P',nextval('seq_postcodes'),'place','postcode', "
            . " hstore('postcode', postcode),'us', "
            . " ST_SetSRID(ST_Point(x,y),4326) as geometry from us_postcode ";
        if (!pg_query($oDB->connection, $sSQL)) {
            fail(pg_last_error($oDB->connection));
        }
    }
}
// Step --osmosis-init: removed; only point the user to its replacement.
if ($aCMDResult['osmosis-init']) {
    $bDidSomething = true;
    $sRemovedNotice = " Command 'osmosis-init' no longer available, please use utils/update.php --init-updates. \n ";
    echo $sRemovedNotice;
}
// Step --index: run the external indexer in three rank ranges, with an
// ANALYSE between the ranges unless --index-noanalyse is given.
if ($aCMDResult['index'] || $aCMDResult['all']) {
    $bDidSomething = true;
    $sOutputFile = '';
    $sBaseCmd = CONST_InstallPath . '/nominatim/nominatim -i'
        . ' -d ' . $aDSNInfo['database']
        . ' -P ' . $aDSNInfo['port']
        . ' -t ' . $iInstances
        . $sOutputFile;

    passthruCheckReturn($sBaseCmd . ' -R 4');
    if (!$aCMDResult['index-noanalyse']) {
        pgsqlRunScript('ANALYSE');
    }

    passthruCheckReturn($sBaseCmd . ' -r 5 -R 25');
    if (!$aCMDResult['index-noanalyse']) {
        pgsqlRunScript('ANALYSE');
    }

    passthruCheckReturn($sBaseCmd . ' -r 26');
}
// Step --create-search-indices: instantiate and run sql/indices.src.sql.
if ($aCMDResult['create-search-indices'] || $aCMDResult['all']) {
    echo " Search indices \n ";
    $bDidSomething = true;

    $sTemplate = file_get_contents(CONST_BasePath . '/sql/indices.src.sql');

    // Placeholder => configured tablespace, substituted in this order.
    $aIndexTablespaces = array(
        '{ts:address-index}' => CONST_Tablespace_Address_Index,
        '{ts:search-index}' => CONST_Tablespace_Search_Index,
        '{ts:aux-index}' => CONST_Tablespace_Aux_Index
    );
    foreach ($aIndexTablespaces as $sTsPlaceholder => $sTsName) {
        $sTemplate = replace_tablespace($sTsPlaceholder, $sTsName, $sTemplate);
    }

    pgsqlRunScript($sTemplate);
}
// Step --create-country-names: register the searchable names of all
// countries by calling getorcreate_country() for each known name.
if ($aCMDResult['create-country-names'] || $aCMDResult['all']) {
    // Terminate the banner so that later output starts on its own line,
    // like the banners of the other steps.
    echo 'Creating search index for default country names' . "\n";
    $bDidSomething = true;

    // Common aliases, the country codes themselves and the default names.
    pgsqlRunScript(" select getorcreate_country(make_standard_name('uk'), 'gb') ");
    pgsqlRunScript(" select getorcreate_country(make_standard_name('united states'), 'us') ");
    pgsqlRunScript(" select count(*) from (select getorcreate_country(make_standard_name(country_code), country_code) from country_name where country_code is not null) as x ");
    pgsqlRunScript(" select count(*) from (select getorcreate_country(make_standard_name(name->'name'), country_code) from country_name where name ? 'name') as x ");

    // Localised names: either only the configured languages or every
    // 'name:*' key.
    $sSQL = 'select count(*) from (select getorcreate_country(make_standard_name(v), country_code) from (select country_code, skeys(name) as k, svals(name) as v from country_name) x where k ';
    if (CONST_Languages) {
        // The hstore keys have the exact form 'name:<lang>'. Any extra
        // whitespace inside the literal would make the comparison fail,
        // so the language codes are trimmed and joined without padding.
        $aNameKeys = array();
        foreach (explode(',', CONST_Languages) as $sLang) {
            $aNameKeys[] = "'name:" . trim($sLang) . "'";
        }
        $sSQL .= 'in (' . implode(',', $aNameKeys) . ')';
    } else {
        // all include all simple name tags
        $sSQL .= " like 'name:%' ";
    }
    $sSQL .= ') v';
    pgsqlRunScript($sSQL);
}
// Step --drop: remove every table that is only needed for updates.
if ($aCMDResult['drop']) {
    // The implementation is potentially a bit dangerous because it uses
    // a positive selection of tables to keep, and deletes everything else.
    // Including any tables that the unsuspecting user might have manually
    // created. USE AT YOUR OWN PERIL.
    $bDidSomething = true;

    // tables we want to keep. everything else goes.
    // These are fnmatch() patterns and must not contain any padding:
    // a pattern with surrounding spaces matches no table name at all,
    // which would cause every table to be dropped.
    $aKeepTables = array(
        '*columns',
        'import_polygon_*',
        'import_status',
        'place_addressline',
        'location_property*',
        'placex',
        'search_name',
        'seq_*',
        'word',
        'query_log',
        'new_query_log',
        'gb_postcode',
        'spatial_ref_sys',
        'country_name',
        'place_classtype_*'
    );

    $oDB =& getDB();
    $aDropTables = array();
    $aHaveTables = chksql($oDB->getCol(" SELECT tablename FROM pg_tables WHERE schemaname='public' "));

    // Collect every existing table that matches none of the keep patterns.
    foreach ($aHaveTables as $sTable) {
        $bFound = false;
        foreach ($aKeepTables as $sKeep) {
            if (fnmatch($sKeep, $sTable)) {
                $bFound = true;
                break;
            }
        }
        if (!$bFound) {
            $aDropTables[] = $sTable;
        }
    }

    foreach ($aDropTables as $sDrop) {
        if ($aCMDResult['verbose']) {
            echo " dropping table $sDrop\n ";
        }
        @pg_query($oDB->connection, " DROP TABLE $sDrop CASCADE ");
        // ignore warnings/errors as they might be caused by a table having
        // been deleted already by CASCADE
    }

    // The flat node file is only used by osm2pgsql. It may be configured
    // without ever having been created, so only delete it when present.
    if (!is_null(CONST_Osm2pgsql_Flatnode_File)) {
        if ($aCMDResult['verbose']) {
            echo " deleting " . CONST_Osm2pgsql_Flatnode_File . " \n ";
        }
        if (file_exists(CONST_Osm2pgsql_Flatnode_File)) {
            unlink(CONST_Osm2pgsql_Flatnode_File);
        }
    }
}
// Report success when at least one step ran, otherwise print the usage.
if ($bDidSomething) {
    echo " Setup finished. \n ";
} else {
    showUsage($aCMDOptions, true);
}
/**
 * Run an SQL file through psql against the configured database.
 *
 * Files ending in .gz are decompressed with zcat and piped into psql,
 * all other files are handed to psql with -f. The output of psql is
 * echoed. Calls fail() when the file is missing, when a process cannot
 * be started or when psql exits with a status greater than zero.
 *
 * @param string $sFilename Path of the (optionally gzipped) SQL file.
 *
 * @return void
 */
function pgsqlRunScriptFile($sFilename)
{
    if (!file_exists($sFilename)) {
        fail('unable to find ' . $sFilename);
    }

    // Convert database DSN to psql parameters
    $aDSNInfo = DB::parseDSN(CONST_Database_DSN);
    if (!isset($aDSNInfo['port']) || !$aDSNInfo['port']) {
        $aDSNInfo['port'] = 5432;
    }
    $sCMD = 'psql -p ' . $aDSNInfo['port'] . ' -d ' . $aDSNInfo['database'];

    // The filename is shell-escaped so that paths with spaces or other
    // shell metacharacters reach zcat/psql as a single argument.
    $ahGzipPipes = null;
    if (preg_match('/\\.gz$/', $sFilename)) {
        $aDescriptors = array(
            0 => array('pipe', 'r'),
            1 => array('pipe', 'w'),
            2 => array('file', '/dev/null', 'a')
        );
        $hGzipProcess = proc_open('zcat ' . escapeshellarg($sFilename), $aDescriptors, $ahGzipPipes);
        if (!is_resource($hGzipProcess)) {
            fail('unable to start zcat');
        }
        // psql reads its input directly from the output of zcat.
        $aReadPipe = $ahGzipPipes[1];
        fclose($ahGzipPipes[0]);
    } else {
        $sCMD .= ' -f ' . escapeshellarg($sFilename);
        $aReadPipe = array('pipe', 'r');
    }

    $aDescriptors = array(
        0 => $aReadPipe,
        1 => array('pipe', 'w'),
        2 => array('file', '/dev/null', 'a')
    );
    $ahPipes = null;
    $hProcess = proc_open($sCMD, $aDescriptors, $ahPipes);
    if (!is_resource($hProcess)) {
        fail('unable to start pgsql');
    }

    // Without zcat a stdin pipe was created for psql. Nothing is written
    // to it, so close it right away instead of leaving it open.
    if (isset($ahPipes[0])) {
        fclose($ahPipes[0]);
    }

    // TODO: error checking
    while (!feof($ahPipes[1])) {
        echo fread($ahPipes[1], 4096);
    }
    fclose($ahPipes[1]);

    $iReturn = proc_close($hProcess);
    if ($iReturn > 0) {
        fail(" pgsql returned with error code ( $iReturn ) ");
    }

    if ($ahGzipPipes) {
        fclose($ahGzipPipes[1]);
        proc_close($hGzipProcess);
    }
}
/**
 * Feed an SQL script to psql via stdin.
 *
 * psql inherits STDOUT and STDERR of this process. With $bfatal set,
 * psql is told to stop at the first error (unless --ignore-errors was
 * given) and a positive exit status leads to fail().
 *
 * @param string $sScript SQL text to execute.
 * @param bool   $bfatal  Whether SQL errors abort the setup.
 *
 * @return void
 */
function pgsqlRunScript($sScript, $bfatal = true)
{
    global $aCMDResult;

    // Convert database DSN to psql parameters
    $aDSNInfo = DB::parseDSN(CONST_Database_DSN);
    if (empty($aDSNInfo['port'])) {
        $aDSNInfo['port'] = 5432;
    }

    $sCMD = 'psql -p ' . $aDSNInfo['port'] . ' -d ' . $aDSNInfo['database'];
    $bStopOnError = $bfatal && !$aCMDResult['ignore-errors'];
    if ($bStopOnError) {
        $sCMD .= ' -v ON_ERROR_STOP=1';
    }

    $aDescriptors = array(
        0 => array('pipe', 'r'),
        1 => STDOUT,
        2 => STDERR
    );
    $ahPipes = null;
    $hProcess = @proc_open($sCMD, $aDescriptors, $ahPipes);
    if (!is_resource($hProcess)) {
        fail('unable to start pgsql');
    }

    // fwrite() may accept only part of the data; keep writing the rest
    // until everything is sent or the pipe stops accepting data.
    $sRemaining = $sScript;
    while (strlen($sRemaining)) {
        $iWritten = fwrite($ahPipes[0], $sRemaining);
        if ($iWritten <= 0) {
            break;
        }
        $sRemaining = substr($sRemaining, $iWritten);
    }
    fclose($ahPipes[0]);

    $iReturn = proc_close($hProcess);
    if ($bfatal && $iReturn > 0) {
        fail(" pgsql returned with error code ( $iReturn ) ");
    }
}
/**
 * Expand the partition sections of an SQL template and run the result.
 *
 * Every section between a line starting with '-- start' and a line
 * starting with '-- end' is repeated once per partition, with
 * '-partition-' replaced by the partition number.
 *
 * @param string $sTemplate SQL template text.
 *
 * @return void
 */
function pgsqlRunPartitionScript($sTemplate)
{
    global $aCMDResult;
    $oDB =& getDB();

    // Partitions in use; partition 0 is added explicitly unless
    // partitioning is disabled.
    $aPartitions = chksql($oDB->getCol('select distinct partition from country_name'));
    if (!$aCMDResult['no-partitions']) {
        $aPartitions[] = 0;
    }

    preg_match_all('#^-- start(.*?)^-- end#ms', $sTemplate, $aSections, PREG_SET_ORDER);
    foreach ($aSections as $aSection) {
        $sSectionBody = $aSection[1];
        $sExpanded = '';
        foreach ($aPartitions as $sPartitionName) {
            $sExpanded .= str_replace('-partition-', $sPartitionName, $sSectionBody);
        }
        // Swap the whole marked section for its expanded copies.
        $sTemplate = str_replace($aSection[0], $sExpanded, $sTemplate);
    }

    pgsqlRunScript($sTemplate);
}
/**
 * Restore the data of a custom-format dump with pg_restore (-Fc -a).
 *
 * The output of pg_restore is echoed. Calls fail() when pg_restore
 * cannot be started; its exit status is not evaluated.
 *
 * @param string $sDumpFile Path of the dump file.
 *
 * @return void
 */
function pgsqlRunRestoreData($sDumpFile)
{
    // Convert database DSN to psql parameters
    $aDSNInfo = DB::parseDSN(CONST_Database_DSN);
    if (!isset($aDSNInfo['port']) || !$aDSNInfo['port']) {
        $aDSNInfo['port'] = 5432;
    }

    // The dump path is shell-escaped so that paths with spaces or other
    // shell metacharacters reach pg_restore as a single argument.
    $sCMD = 'pg_restore -p ' . $aDSNInfo['port'] . ' -d ' . $aDSNInfo['database']
        . ' -Fc -a ' . escapeshellarg($sDumpFile);

    $aDescriptors = array(
        0 => array('pipe', 'r'),
        1 => array('pipe', 'w'),
        2 => array('file', '/dev/null', 'a')
    );
    $ahPipes = null;
    $hProcess = proc_open($sCMD, $aDescriptors, $ahPipes);
    if (!is_resource($hProcess)) {
        fail('unable to start pg_restore');
    }

    // pg_restore gets no input on stdin.
    fclose($ahPipes[0]);

    // TODO: error checking
    while (!feof($ahPipes[1])) {
        echo fread($ahPipes[1], 4096);
    }
    fclose($ahPipes[1]);

    proc_close($hProcess);
}
/**
 * Restore a custom-format dump with pg_restore, dropping the contained
 * database objects first (-Fc --clean).
 *
 * The output of pg_restore is echoed. Calls fail() when pg_restore
 * cannot be started; its exit status is not evaluated.
 *
 * @param string $sDumpFile Path of the dump file.
 *
 * @return void
 */
function pgsqlRunDropAndRestore($sDumpFile)
{
    // Convert database DSN to psql parameters
    $aDSNInfo = DB::parseDSN(CONST_Database_DSN);
    if (!isset($aDSNInfo['port']) || !$aDSNInfo['port']) {
        $aDSNInfo['port'] = 5432;
    }

    // The dump path is shell-escaped so that paths with spaces or other
    // shell metacharacters reach pg_restore as a single argument.
    $sCMD = 'pg_restore -p ' . $aDSNInfo['port'] . ' -d ' . $aDSNInfo['database']
        . ' -Fc --clean ' . escapeshellarg($sDumpFile);

    $aDescriptors = array(
        0 => array('pipe', 'r'),
        1 => array('pipe', 'w'),
        2 => array('file', '/dev/null', 'a')
    );
    $ahPipes = null;
    $hProcess = proc_open($sCMD, $aDescriptors, $ahPipes);
    if (!is_resource($hProcess)) {
        fail('unable to start pg_restore');
    }

    // pg_restore gets no input on stdin.
    fclose($ahPipes[0]);

    // TODO: error checking
    while (!feof($ahPipes[1])) {
        echo fread($ahPipes[1], 4096);
    }
    fclose($ahPipes[1]);

    proc_close($hProcess);
}
/**
 * Run an external command with passthru() and call fail() when it does
 * not exit with status 0.
 *
 * @param string $cmd Complete command line.
 *
 * @return void
 */
function passthruCheckReturn($cmd)
{
    // Preset with an error value in case passthru() does not set it.
    $iExitStatus = -1;
    passthru($cmd, $iExitStatus);

    if ($iExitStatus == 0) {
        return;
    }
    fail('Error executing external command: ' . $cmd);
}
/**
 * Replace a tablespace placeholder in an SQL text.
 *
 * With a tablespace configured the placeholder becomes
 * 'TABLESPACE "<name>"', otherwise it is removed.
 *
 * @param string $sTemplate   Placeholder to look for.
 * @param mixed  $sTablespace Tablespace name, or a falsy value for none.
 * @param string $sSql        SQL text containing the placeholder.
 *
 * @return string SQL text with the placeholder substituted.
 */
function replace_tablespace($sTemplate, $sTablespace, $sSql)
{
    $sClause = $sTablespace ? 'TABLESPACE "' . $sTablespace . '"' : '';

    return str_replace($sTemplate, $sClause, $sSql);
}
/**
 * Instantiate sql/functions.sql for this installation and run it.
 *
 * The module path is always substituted. The remaining markers in the
 * template are replaced depending on command line switches and settings.
 *
 * @param array $aCMDResult Parsed command line options; the keys
 *                          'enable-diff-updates' and
 *                          'enable-debug-statements' are read.
 *
 * @return void
 */
function create_sql_functions($aCMDResult)
{
    $sTemplate = file_get_contents(CONST_BasePath . '/sql/functions.sql');
    $sTemplate = str_replace('{modulepath}', CONST_InstallPath . '/module', $sTemplate);

    // Each entry: condition, marker in the template, replacement text.
    // The replacements are applied in this order.
    $aConditionalEdits = array(
        array($aCMDResult['enable-diff-updates'], 'RETURN NEW; -- %DIFFUPDATES%', '--'),
        array($aCMDResult['enable-debug-statements'], '--DEBUG:', ''),
        array(CONST_Limit_Reindexing, '--LIMIT INDEXING:', ''),
        array(!CONST_Use_US_Tiger_Data, '-- %NOTIGERDATA% ', ''),
        array(!CONST_Use_Aux_Location_data, '-- %NOAUXDATA% ', '')
    );
    foreach ($aConditionalEdits as $aEdit) {
        if ($aEdit[0]) {
            $sTemplate = str_replace($aEdit[1], $aEdit[2], $sTemplate);
        }
    }

    pgsqlRunScript($sTemplate);
}