2011-03-18 15:36:17 +03:00
#!/usr/bin/php -Cq
< ? php
2011-04-27 16:14:33 +04:00
2016-03-09 02:07:46 +03:00
require_once ( dirname ( dirname ( __FILE__ )) . '/settings/settings.php' );
require_once ( CONST_BasePath . '/lib/init-cmd.php' );
ini_set ( 'memory_limit' , '800M' );
2011-03-18 15:36:17 +03:00
$aCMDOptions = array (
" Import / update / index osm data " ,
array ( 'help' , 'h' , 0 , 1 , 0 , 0 , false , 'Show Help' ),
array ( 'quiet' , 'q' , 0 , 1 , 0 , 0 , 'bool' , 'Quiet output' ),
array ( 'verbose' , 'v' , 0 , 1 , 0 , 0 , 'bool' , 'Verbose output' ),
array ( 'max-load' , '' , 0 , 1 , 1 , 1 , 'float' , 'Maximum load average - indexing is paused if this is exceeded' ),
array ( 'max-blocking' , '' , 0 , 1 , 1 , 1 , 'int' , 'Maximum blocking processes - indexing is aborted / paused if this is exceeded' ),
array ( 'import-osmosis' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import using osmosis' ),
array ( 'import-osmosis-all' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import using osmosis forever' ),
2012-05-22 18:27:42 +04:00
array ( 'no-npi' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Do not write npi index files' ),
array ( 'no-index' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Do not index the new data' ),
2011-03-18 15:36:17 +03:00
array ( 'import-npi-all' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import npi pre-indexed files' ),
array ( 'import-hourly' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import hourly diffs' ),
array ( 'import-daily' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import daily diffs' ),
array ( 'import-all' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Import all available files' ),
array ( 'import-file' , '' , 0 , 1 , 1 , 1 , 'realpath' , 'Re-import data from an OSM file' ),
array ( 'import-diff' , '' , 0 , 1 , 1 , 1 , 'realpath' , 'Import a diff (osc) file from local file system' ),
2013-09-16 01:10:26 +04:00
array ( 'osm2pgsql-cache' , '' , 0 , 1 , 1 , 1 , 'int' , 'Cache size used by osm2pgsql' ),
2011-03-18 15:36:17 +03:00
array ( 'import-node' , '' , 0 , 1 , 1 , 1 , 'int' , 'Re-import node' ),
array ( 'import-way' , '' , 0 , 1 , 1 , 1 , 'int' , 'Re-import way' ),
array ( 'import-relation' , '' , 0 , 1 , 1 , 1 , 'int' , 'Re-import relation' ),
2012-05-23 00:23:46 +04:00
array ( 'import-from-main-api' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Use OSM API instead of Overpass to download objects' ),
2011-03-18 15:36:17 +03:00
array ( 'index' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Index' ),
array ( 'index-rank' , '' , 0 , 1 , 1 , 1 , 'int' , 'Rank to start indexing from' ),
array ( 'index-instances' , '' , 0 , 1 , 1 , 1 , 'int' , 'Number of indexing instances (threads)' ),
array ( 'index-estrate' , '' , 0 , 1 , 1 , 1 , 'int' , 'Estimated indexed items per second (def:30)' ),
array ( 'deduplicate' , '' , 0 , 1 , 0 , 0 , 'bool' , 'Deduplicate tokens' ),
);
getCmdOpt ( $_SERVER [ 'argv' ], $aCMDOptions , $aResult , true , true );
if ( $aResult [ 'import-hourly' ] + $aResult [ 'import-daily' ] + isset ( $aResult [ 'import-diff' ]) > 1 )
{
showUsage ( $aCMDOptions , true , 'Select either import of hourly or daily' );
}
if ( ! isset ( $aResult [ 'index-instances' ])) $aResult [ 'index-instances' ] = 1 ;
2012-05-22 23:05:31 +04:00
if ( ! isset ( $aResult [ 'index-rank' ])) $aResult [ 'index-rank' ] = 0 ;
2013-09-16 01:10:26 +04:00
2011-03-18 15:36:17 +03:00
/*
// Lock to prevent multiple copies running
if ( exec ( '/bin/ps uww | grep ' . basename ( __FILE__ ) . ' | grep -v /dev/null | grep -v grep -c' , $aOutput2 , $iResult ) > 1 )
{
2015-12-07 16:08:02 +03:00
fail ( " Copy already running \n " );
2011-03-18 15:36:17 +03:00
}
if ( ! isset ( $aResult [ 'max-load' ])) $aResult [ 'max-load' ] = 1.9 ;
if ( ! isset ( $aResult [ 'max-blocking' ])) $aResult [ 'max-blocking' ] = 3 ;
if ( getBlockingProcesses () > $aResult [ 'max-blocking' ])
{
2015-12-07 16:08:02 +03:00
fail ( " Too many blocking processes for import \n " );
2011-03-18 15:36:17 +03:00
}
*/
2012-12-09 01:42:12 +04:00
date_default_timezone_set ( 'Etc/UTC' );
2011-03-18 15:36:17 +03:00
$oDB =& getDB ();
2012-04-20 20:29:14 +04:00
$aDSNInfo = DB :: parseDSN ( CONST_Database_DSN );
2013-11-14 01:24:10 +04:00
if ( ! isset ( $aDSNInfo [ 'port' ]) || ! $aDSNInfo [ 'port' ]) $aDSNInfo [ 'port' ] = 5432 ;
2012-04-20 20:29:14 +04:00
2013-09-16 01:10:26 +04:00
// cache memory to be used by osm2pgsql, should not be more than the available memory
$iCacheMemory = ( isset ( $aResult [ 'osm2pgsql-cache' ]) ? $aResult [ 'osm2pgsql-cache' ] : 2000 );
if ( $iCacheMemory + 500 > getTotalMemoryMB ())
{
$iCacheMemory = getCacheMemoryMB ();
echo " WARNING: resetting cache memory to $iCacheMemory\n " ;
}
2015-08-29 14:14:11 +03:00
$sOsm2pgsqlCmd = CONST_Osm2pgsql_Binary . ' -klas --number-processes 1 -C ' . $iCacheMemory . ' -O gazetteer -d ' . $aDSNInfo [ 'database' ] . ' -P ' . $aDSNInfo [ 'port' ];
2013-09-16 01:10:26 +04:00
if ( ! is_null ( CONST_Osm2pgsql_Flatnode_File ))
{
$sOsm2pgsqlCmd .= ' --flat-nodes ' . CONST_Osm2pgsql_Flatnode_File ;
}
2011-03-18 15:36:17 +03:00
$bFirst = true ;
$bContinue = $aResult [ 'import-all' ];
while ( $bContinue || $bFirst )
{
$bFirst = false ;
if ( $aResult [ 'import-hourly' ])
{
// Mirror the hourly diffs
exec ( 'wget --quiet --mirror -l 1 -P ' . $sMirrorDir . ' http://planet.openstreetmap.org/hourly' );
$sNextFile = $oDB -> getOne ( 'select TO_CHAR(lastimportdate,\'YYYYMMDDHH24\')||\'-\'||TO_CHAR(lastimportdate+\'1 hour\'::interval,\'YYYYMMDDHH24\')||\'.osc.gz\' from import_status' );
$sNextFile = $sMirrorDir . 'planet.openstreetmap.org/hourly/' . $sNextFile ;
$sUpdateSQL = 'update import_status set lastimportdate = lastimportdate+\'1 hour\'::interval' ;
}
if ( $aResult [ 'import-daily' ])
{
// Mirror the daily diffs
exec ( 'wget --quiet --mirror -l 1 -P ' . $sMirrorDir . ' http://planet.openstreetmap.org/daily' );
$sNextFile = $oDB -> getOne ( 'select TO_CHAR(lastimportdate,\'YYYYMMDD\')||\'-\'||TO_CHAR(lastimportdate+\'1 day\'::interval,\'YYYYMMDD\')||\'.osc.gz\' from import_status' );
$sNextFile = $sMirrorDir . 'planet.openstreetmap.org/daily/' . $sNextFile ;
$sUpdateSQL = 'update import_status set lastimportdate = lastimportdate::date + 1' ;
}
if ( isset ( $aResult [ 'import-diff' ]))
{
// import diff directly (e.g. from osmosis --rri)
$sNextFile = $aResult [ 'import-diff' ];
2012-04-20 20:29:14 +04:00
if ( ! file_exists ( $sNextFile ))
2011-03-18 15:36:17 +03:00
{
2015-12-07 16:08:02 +03:00
fail ( " Cannot open $sNextFile\n " );
2011-03-18 15:36:17 +03:00
}
// Don't update the import status - we don't know what this file contains
$sUpdateSQL = 'update import_status set lastimportdate = now() where false' ;
}
// Missing file is not an error - it might not be created yet
2012-04-20 20:29:14 +04:00
if (( $aResult [ 'import-hourly' ] || $aResult [ 'import-daily' ] || isset ( $aResult [ 'import-diff' ])) && file_exists ( $sNextFile ))
2011-03-18 15:36:17 +03:00
{
// Import the file
2013-09-16 01:10:26 +04:00
$sCMD = $sOsm2pgsqlCmd . ' ' . $sNextFile ;
2011-03-18 15:36:17 +03:00
echo $sCMD . " \n " ;
exec ( $sCMD , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
2015-12-07 16:08:02 +03:00
fail ( " Error from osm2pgsql, $iErrorLevel\n " );
2011-03-18 15:36:17 +03:00
}
// Move the date onwards
$oDB -> query ( $sUpdateSQL );
}
else
{
$bContinue = false ;
}
}
2012-04-20 20:29:14 +04:00
$bModifyXML = false ;
$sModifyXMLstr = '' ;
2012-05-23 00:23:46 +04:00
$bUseOSMApi = isset ( $aResult [ 'import-from-main-api' ]) && $aResult [ 'import-from-main-api' ];
2011-03-18 15:36:17 +03:00
if ( isset ( $aResult [ 'import-file' ]) && $aResult [ 'import-file' ])
{
2012-04-20 20:29:14 +04:00
$bModifyXML = true ;
2011-03-18 15:36:17 +03:00
}
if ( isset ( $aResult [ 'import-node' ]) && $aResult [ 'import-node' ])
{
2012-04-20 20:29:14 +04:00
$bModifyXML = true ;
2012-05-23 00:23:46 +04:00
if ( $bUseOSMApi )
{
$sModifyXMLstr = file_get_contents ( 'http://www.openstreetmap.org/api/0.6/node/' . $aResult [ 'import-node' ]);
}
else
{
2013-02-26 23:42:57 +04:00
$sModifyXMLstr = file_get_contents ( 'http://overpass-api.de/api/interpreter?data=node(' . $aResult [ 'import-node' ] . ');out%20meta;' );
2012-05-23 00:23:46 +04:00
}
2011-03-18 15:36:17 +03:00
}
if ( isset ( $aResult [ 'import-way' ]) && $aResult [ 'import-way' ])
{
2012-04-20 20:29:14 +04:00
$bModifyXML = true ;
2012-05-23 00:23:46 +04:00
if ( $bUseOSMApi )
{
$sCmd = 'http://www.openstreetmap.org/api/0.6/way/' . $aResult [ 'import-way' ] . '/full' ;
}
else
{
2013-02-26 23:42:57 +04:00
$sCmd = 'http://overpass-api.de/api/interpreter?data=(way(' . $aResult [ 'import-way' ] . ');node(w););out%20meta;' ;
2012-05-23 00:23:46 +04:00
}
$sModifyXMLstr = file_get_contents ( $sCmd );
2011-03-18 15:36:17 +03:00
}
if ( isset ( $aResult [ 'import-relation' ]) && $aResult [ 'import-relation' ])
{
2012-04-20 20:29:14 +04:00
$bModifyXML = true ;
2012-05-23 00:23:46 +04:00
if ( $bUseOSMApi )
{
$sModifyXMLstr = file_get_contents ( 'http://www.openstreetmap.org/api/0.6/relation/' . $aResult [ 'import-relation' ] . '/full' );
}
else
{
2013-02-26 23:42:57 +04:00
$sModifyXMLstr = file_get_contents ( 'http://overpass-api.de/api/interpreter?data=((rel(' . $aResult [ 'import-relation' ] . ');way(r);node(w));node(r));out%20meta;' );
2012-05-23 00:23:46 +04:00
}
2011-03-18 15:36:17 +03:00
}
2012-04-20 20:29:14 +04:00
if ( $bModifyXML )
2011-03-18 15:36:17 +03:00
{
2012-04-20 20:29:14 +04:00
// derive change from normal osm file with osmosis
$sTemporaryFile = CONST_BasePath . '/data/osmosischange.osc' ;
2012-05-05 12:56:31 +04:00
if ( isset ( $aResult [ 'import-file' ]) && $aResult [ 'import-file' ])
2012-04-20 20:29:14 +04:00
{
$sCMD = CONST_Osmosis_Binary . ' --read-xml \'' . $aResult [ 'import-file' ] . '\' --read-empty --derive-change --write-xml-change ' . $sTemporaryFile ;
echo $sCMD . " \n " ;
exec ( $sCMD , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
2015-12-07 16:08:02 +03:00
fail ( " Error converting osm to osc, osmosis returned: $iErrorLevel\n " );
2012-04-20 20:29:14 +04:00
}
}
else
2011-03-18 15:36:17 +03:00
{
2012-04-20 20:29:14 +04:00
$aSpec = array (
0 => array ( " pipe " , " r " ), // stdin
1 => array ( " pipe " , " w " ), // stdout
2 => array ( " pipe " , " w " ) // stderr
);
$sCMD = CONST_Osmosis_Binary . ' --read-xml - --read-empty --derive-change --write-xml-change ' . $sTemporaryFile ;
echo $sCMD . " \n " ;
$hProc = proc_open ( $sCMD , $aSpec , $aPipes );
if ( ! is_resource ( $hProc ))
{
2015-12-07 16:08:02 +03:00
fail ( " Error converting osm to osc, osmosis failed \n " );
2012-04-20 20:29:14 +04:00
}
fwrite ( $aPipes [ 0 ], $sModifyXMLstr );
fclose ( $aPipes [ 0 ]);
$sOut = stream_get_contents ( $aPipes [ 1 ]);
if ( $aResult [ 'verbose' ]) echo $sOut ;
fclose ( $aPipes [ 1 ]);
$sErrors = stream_get_contents ( $aPipes [ 2 ]);
if ( $aResult [ 'verbose' ]) echo $sErrors ;
fclose ( $aPipes [ 2 ]);
if ( $iError = proc_close ( $hProc ))
{
echo " Error converting osm to osc, osmosis returned: $iError\n " ;
echo $sOut ;
echo $sErrors ;
2015-12-07 16:08:02 +03:00
exit ( - 1 );
2012-04-20 20:29:14 +04:00
}
2011-03-18 15:36:17 +03:00
}
2012-04-20 20:29:14 +04:00
// import generated change file
2013-09-16 01:10:26 +04:00
$sCMD = $sOsm2pgsqlCmd . ' ' . $sTemporaryFile ;
2012-04-20 20:29:14 +04:00
echo $sCMD . " \n " ;
exec ( $sCMD , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
2011-03-18 15:36:17 +03:00
{
2015-12-07 16:08:02 +03:00
fail ( " osm2pgsql exited with error level $iErrorLevel\n " );
2011-03-18 15:36:17 +03:00
}
}
if ( $aResult [ 'deduplicate' ])
{
2014-06-30 20:49:24 +04:00
$pgver = ( float ) CONST_Postgresql_Version ;
if ( $pgver < 9.3 ) {
2015-12-07 16:08:02 +03:00
fail ( " ERROR: deduplicate is only currently supported in postgresql 9.3 " );
2014-06-30 20:49:24 +04:00
}
2011-03-18 15:36:17 +03:00
$oDB =& getDB ();
$sSQL = 'select partition from country_name order by country_code' ;
$aPartitions = $oDB -> getCol ( $sSQL );
if ( PEAR :: isError ( $aPartitions ))
{
fail ( $aPartitions -> getMessage ());
}
$aPartitions [] = 0 ;
$sSQL = " select word_token,count(*) from word where substr(word_token, 1, 1) = ' ' and class is null and type is null and country_code is null group by word_token having count(*) > 1 order by word_token " ;
$aDuplicateTokens = $oDB -> getAll ( $sSQL );
foreach ( $aDuplicateTokens as $aToken )
{
if ( trim ( $aToken [ 'word_token' ]) == '' || trim ( $aToken [ 'word_token' ]) == '-' ) continue ;
echo " Deduping " . $aToken [ 'word_token' ] . " \n " ;
$sSQL = " select word_id,(select count(*) from search_name where nameaddress_vector @> ARRAY[word_id]) as num from word where word_token = ' " . $aToken [ 'word_token' ] . " ' and class is null and type is null and country_code is null order by num desc " ;
$aTokenSet = $oDB -> getAll ( $sSQL );
if ( PEAR :: isError ( $aTokenSet ))
{
var_dump ( $aTokenSet , $sSQL );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
2014-06-30 20:49:24 +04:00
2011-03-18 15:36:17 +03:00
$aKeep = array_shift ( $aTokenSet );
$iKeepID = $aKeep [ 'word_id' ];
foreach ( $aTokenSet as $aRemove )
{
$sSQL = " update search_name set " ;
2014-06-30 20:49:24 +04:00
$sSQL .= " name_vector = array_replace(name_vector, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ), " ;
$sSQL .= " nameaddress_vector = array_replace(nameaddress_vector, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ) " ;
2011-03-18 15:36:17 +03:00
$sSQL .= " where name_vector @> ARRAY[ " . $aRemove [ 'word_id' ] . " ] " ;
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
$sSQL = " update search_name set " ;
2014-06-30 20:49:24 +04:00
$sSQL .= " nameaddress_vector = array_replace(nameaddress_vector, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ) " ;
2011-03-18 15:36:17 +03:00
$sSQL .= " where nameaddress_vector @> ARRAY[ " . $aRemove [ 'word_id' ] . " ] " ;
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
$sSQL = " update location_area_country set " ;
2014-06-30 20:49:24 +04:00
$sSQL .= " keywords = array_replace(keywords, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ) " ;
2011-03-18 15:36:17 +03:00
$sSQL .= " where keywords @> ARRAY[ " . $aRemove [ 'word_id' ] . " ] " ;
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
foreach ( $aPartitions as $sPartition )
{
$sSQL = " update search_name_ " . $sPartition . " set " ;
2014-06-30 20:49:24 +04:00
$sSQL .= " name_vector = array_replace(name_vector, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ) " ;
2011-03-18 15:36:17 +03:00
$sSQL .= " where name_vector @> ARRAY[ " . $aRemove [ 'word_id' ] . " ] " ;
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
$sSQL = " update location_area_country set " ;
2014-06-30 20:49:24 +04:00
$sSQL .= " keywords = array_replace(keywords, " . $aRemove [ 'word_id' ] . " , " . $iKeepID . " ) " ;
2011-03-18 15:36:17 +03:00
$sSQL .= " where keywords @> ARRAY[ " . $aRemove [ 'word_id' ] . " ] " ;
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
}
$sSQL = " delete from word where word_id = " . $aRemove [ 'word_id' ];
$x = $oDB -> query ( $sSQL );
if ( PEAR :: isError ( $x ))
{
var_dump ( $x );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
}
}
}
if ( $aResult [ 'index' ])
{
2016-02-28 18:42:24 +03:00
passthru ( CONST_InstallPath . '/nominatim/nominatim -i -d ' . $aDSNInfo [ 'database' ] . ' -P ' . $aDSNInfo [ 'port' ] . ' -t ' . $aResult [ 'index-instances' ] . ' -r ' . $aResult [ 'index-rank' ]);
2011-03-18 15:36:17 +03:00
}
if ( $aResult [ 'import-osmosis' ] || $aResult [ 'import-osmosis-all' ])
{
2013-09-19 15:22:29 +04:00
if ( strpos ( CONST_Replication_Url , 'download.geofabrik.de' ) !== false && CONST_Replication_Update_Interval < 86400 ) {
2015-12-07 16:08:02 +03:00
fail ( " Error: Update interval too low for download.geofabrik.de. Please check install documentation (http://wiki.openstreetmap.org/wiki/Nominatim/Installation#Updates) \n " );
2013-09-19 15:22:29 +04:00
}
2011-03-18 15:36:17 +03:00
$sImportFile = CONST_BasePath . '/data/osmosischange.osc' ;
2012-01-21 14:21:42 +04:00
$sOsmosisCMD = CONST_Osmosis_Binary ;
2016-02-28 18:42:24 +03:00
$sOsmosisConfigDirectory = CONST_InstallPath . '/settings' ;
2011-03-18 15:36:17 +03:00
$sCMDDownload = $sOsmosisCMD . ' --read-replication-interval workingDirectory=' . $sOsmosisConfigDirectory . ' --simplify-change --write-xml-change ' . $sImportFile ;
2013-03-26 18:49:35 +04:00
$sCMDCheckReplicationLag = $sOsmosisCMD . ' -q --read-replication-lag workingDirectory=' . $sOsmosisConfigDirectory ;
2013-09-16 01:10:26 +04:00
$sCMDImport = $sOsm2pgsqlCmd . ' ' . $sImportFile ;
2016-02-28 18:42:24 +03:00
$sCMDIndex = $sInstallPath . '/nominatim/nominatim -i -d ' . $aDSNInfo [ 'database' ] . ' -P ' . $aDSNInfo [ 'port' ] . ' -t ' . $aResult [ 'index-instances' ];
2012-01-21 14:21:42 +04:00
if ( ! $aResult [ 'no-npi' ]) {
$sCMDIndex .= '-F ' ;
}
2011-03-18 15:36:17 +03:00
while ( true )
{
$fStartTime = time ();
$iFileSize = 1001 ;
// Logic behind this is that osm2pgsql locks the database quite a bit
// So it is better to import lots of small files
// But indexing works most efficiently on large amounts of data
// So do lots of small imports and a BIG index
// while($aResult['import-osmosis-all'] && $iFileSize > 1000)
// {
if ( ! file_exists ( $sImportFile ))
{
2013-03-26 18:49:35 +04:00
// First check if there are new updates published (except for minutelies - there's always new diffs to process)
if ( CONST_Replication_Update_Interval > 60 )
{
unset ( $aReplicationLag );
exec ( $sCMDCheckReplicationLag , $aReplicationLag , $iErrorLevel );
2013-08-30 12:42:21 +04:00
while ( $iErrorLevel > 0 || $aReplicationLag [ 0 ] < 1 )
2013-03-26 18:49:35 +04:00
{
if ( $iErrorLevel )
{
echo " Error: $iErrorLevel . " ;
echo " Re-trying: " . $sCMDCheckReplicationLag . " in " . CONST_Replication_Recheck_Interval . " secs \n " ;
}
else
{
echo " . " ;
}
sleep ( CONST_Replication_Recheck_Interval );
unset ( $aReplicationLag );
exec ( $sCMDCheckReplicationLag , $aReplicationLag , $iErrorLevel );
}
// There are new replication files - use osmosis to download the file
2013-09-30 16:44:50 +04:00
echo " \n " . date ( 'Y-m-d H:i:s' ) . " Replication Delay is " . $aReplicationLag [ 0 ] . " \n " ;
2013-03-26 18:49:35 +04:00
}
2013-10-02 13:53:21 +04:00
$fStartTime = time ();
2011-03-18 15:36:17 +03:00
$fCMDStartTime = time ();
echo $sCMDDownload . " \n " ;
exec ( $sCMDDownload , $sJunk , $iErrorLevel );
2013-08-30 12:42:21 +04:00
while ( $iErrorLevel > 0 )
2011-03-18 15:36:17 +03:00
{
echo " Error: $iErrorLevel\n " ;
2011-04-27 16:14:33 +04:00
sleep ( 60 );
echo 'Re-trying: ' . $sCMDDownload . " \n " ;
exec ( $sCMDDownload , $sJunk , $iErrorLevel );
2011-03-18 15:36:17 +03:00
}
$iFileSize = filesize ( $sImportFile );
$sBatchEnd = getosmosistimestamp ( $sOsmosisConfigDirectory );
$sSQL = " INSERT INTO import_osmosis_log values (' $sBatchEnd ', $iFileSize ,' " . date ( 'Y-m-d H:i:s' , $fCMDStartTime ) . " ',' " . date ( 'Y-m-d H:i:s' ) . " ','osmosis') " ;
2013-09-30 16:25:30 +04:00
var_Dump ( $sSQL );
2011-03-18 15:36:17 +03:00
$oDB -> query ( $sSQL );
2013-10-02 13:53:21 +04:00
echo date ( 'Y-m-d H:i:s' ) . " Completed osmosis step for $sBatchEnd in " . round (( time () - $fCMDStartTime ) / 60 , 2 ) . " minutes \n " ;
2011-03-18 15:36:17 +03:00
}
$iFileSize = filesize ( $sImportFile );
$sBatchEnd = getosmosistimestamp ( $sOsmosisConfigDirectory );
// Import the file
$fCMDStartTime = time ();
echo $sCMDImport . " \n " ;
exec ( $sCMDImport , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
echo " Error: $iErrorLevel\n " ;
2013-09-26 01:05:47 +04:00
exit ( $iErrorLevel );
2011-03-18 15:36:17 +03:00
}
$sSQL = " INSERT INTO import_osmosis_log values (' $sBatchEnd ', $iFileSize ,' " . date ( 'Y-m-d H:i:s' , $fCMDStartTime ) . " ',' " . date ( 'Y-m-d H:i:s' ) . " ','osm2pgsql') " ;
var_Dump ( $sSQL );
$oDB -> query ( $sSQL );
2013-10-02 13:53:21 +04:00
echo date ( 'Y-m-d H:i:s' ) . " Completed osm2pgsql step for $sBatchEnd in " . round (( time () - $fCMDStartTime ) / 60 , 2 ) . " minutes \n " ;
2011-03-18 15:36:17 +03:00
// Archive for debug?
unlink ( $sImportFile );
2012-05-22 18:27:42 +04:00
// }
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
$sBatchEnd = getosmosistimestamp ( $sOsmosisConfigDirectory );
// Index file
$sThisIndexCmd = $sCMDIndex ;
2013-09-30 16:25:30 +04:00
$fCMDStartTime = time ();
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
if ( ! $aResult [ 'no-npi' ])
{
2011-03-18 15:36:17 +03:00
$iFileID = $oDB -> getOne ( 'select nextval(\'file\')' );
if ( PEAR :: isError ( $iFileID ))
{
2011-09-09 20:00:34 +04:00
echo $iFileID -> getMessage () . " \n " ;
2013-09-26 01:05:47 +04:00
exit ( - 1 );
2011-03-18 15:36:17 +03:00
}
$sFileDir = CONST_BasePath . '/export/diff/' ;
$sFileDir .= str_pad ( floor ( $iFileID / 1000000 ), 3 , '0' , STR_PAD_LEFT );
$sFileDir .= '/' . str_pad ( floor ( $iFileID / 1000 ) % 1000 , 3 , '0' , STR_PAD_LEFT );
if ( ! is_dir ( $sFileDir )) mkdir ( $sFileDir , 0777 , true );
2012-05-22 18:27:42 +04:00
$sThisIndexCmd .= $sFileDir ;
$sThisIndexCmd .= '/' . str_pad ( $iFileID % 1000 , 3 , '0' , STR_PAD_LEFT );
$sThisIndexCmd .= " .npi.out " ;
preg_match ( '#^([0-9]{4})-([0-9]{2})-([0-9]{2})#' , $sBatchEnd , $aBatchMatch );
$sFileDir = CONST_BasePath . '/export/index/' ;
$sFileDir .= $aBatchMatch [ 1 ] . '/' . $aBatchMatch [ 2 ];
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
if ( ! is_dir ( $sFileDir )) mkdir ( $sFileDir , 0777 , true );
file_put_contents ( $sFileDir . '/' . $aBatchMatch [ 3 ] . '.idx' , " $sBatchEnd\t $iFileID\n " , FILE_APPEND );
}
if ( ! $aResult [ 'no-index' ])
{
2011-03-18 15:36:17 +03:00
echo " $sThisIndexCmd\n " ;
exec ( $sThisIndexCmd , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
echo " Error: $iErrorLevel\n " ;
2013-09-26 01:05:47 +04:00
exit ( $iErrorLevel );
2011-03-18 15:36:17 +03:00
}
2012-05-22 18:27:42 +04:00
if ( ! $aResult [ 'no-npi' ])
{
2012-01-21 14:21:42 +04:00
$sFileDir = CONST_BasePath . '/export/diff/' ;
$sFileDir .= str_pad ( floor ( $iFileID / 1000000 ), 3 , '0' , STR_PAD_LEFT );
$sFileDir .= '/' . str_pad ( floor ( $iFileID / 1000 ) % 1000 , 3 , '0' , STR_PAD_LEFT );
$sThisIndexCmd = 'bzip2 -z9 ' . $sFileDir . '/' . str_pad ( $iFileID % 1000 , 3 , '0' , STR_PAD_LEFT ) . " .npi.out " ;
echo " $sThisIndexCmd\n " ;
exec ( $sThisIndexCmd , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
echo " Error: $iErrorLevel\n " ;
2013-09-26 01:05:47 +04:00
exit ( $iErrorLevel );
2012-01-21 14:21:42 +04:00
}
rename ( $sFileDir . '/' . str_pad ( $iFileID % 1000 , 3 , '0' , STR_PAD_LEFT ) . " .npi.out.bz2 " ,
$sFileDir . '/' . str_pad ( $iFileID % 1000 , 3 , '0' , STR_PAD_LEFT ) . " .npi.bz2 " );
}
2012-05-22 18:27:42 +04:00
}
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
$sSQL = " INSERT INTO import_osmosis_log values (' $sBatchEnd ', $iFileSize ,' " . date ( 'Y-m-d H:i:s' , $fCMDStartTime ) . " ',' " . date ( 'Y-m-d H:i:s' ) . " ','index') " ;
2013-09-30 16:25:30 +04:00
var_Dump ( $sSQL );
2012-05-22 18:27:42 +04:00
$oDB -> query ( $sSQL );
2013-10-02 13:53:21 +04:00
echo date ( 'Y-m-d H:i:s' ) . " Completed index step for $sBatchEnd in " . round (( time () - $fCMDStartTime ) / 60 , 2 ) . " minutes \n " ;
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
$sSQL = " update import_status set lastimportdate = ' $sBatchEnd ' " ;
$oDB -> query ( $sSQL );
2011-03-18 15:36:17 +03:00
2012-05-22 18:27:42 +04:00
$fDuration = time () - $fStartTime ;
2013-10-02 13:53:21 +04:00
echo date ( 'Y-m-d H:i:s' ) . " Completed all for $sBatchEnd in " . round ( $fDuration / 60 , 2 ) . " minutes \n " ;
2015-12-07 15:51:30 +03:00
if ( ! $aResult [ 'import-osmosis-all' ]) exit ( 0 );
2011-03-18 15:36:17 +03:00
2013-03-26 18:49:35 +04:00
if ( CONST_Replication_Update_Interval > 60 )
{
2013-09-20 00:56:55 +04:00
$iSleep = max ( 0 ,( strtotime ( $sBatchEnd ) + CONST_Replication_Update_Interval - time ()));
2013-03-26 18:49:35 +04:00
}
else
{
$iSleep = max ( 0 , CONST_Replication_Update_Interval - $fDuration );
}
2013-09-30 16:44:50 +04:00
echo date ( 'Y-m-d H:i:s' ) . " Sleeping $iSleep seconds \n " ;
2013-03-26 18:49:35 +04:00
sleep ( $iSleep );
2011-03-18 15:36:17 +03:00
}
2012-05-22 18:27:42 +04:00
2011-03-18 15:36:17 +03:00
}
if ( $aResult [ 'import-npi-all' ])
{
$iNPIID = $oDB -> getOne ( 'select max(npiid) from import_npi_log' );
if ( PEAR :: isError ( $iNPIID ))
{
var_dump ( $iNPIID );
2015-12-07 15:51:30 +03:00
exit ( 1 );
2011-03-18 15:36:17 +03:00
}
2016-02-28 18:42:24 +03:00
$sConfigDirectory = CONST_InstallPath . '/settings' ;
$sCMDImportTemplate = $sBasePath . '/nominatim/nominatim -d gazetteer -P 5433 -I -T ' . CONST_BasePath . '/nominatim/partitionedtags.def -F ' ;
2011-03-18 15:36:17 +03:00
while ( true )
{
$fStartTime = time ();
$iNPIID ++ ;
$sImportFile = CONST_BasePath . '/export/diff/' ;
$sImportFile .= str_pad ( floor ( $iNPIID / 1000000 ), 3 , '0' , STR_PAD_LEFT );
$sImportFile .= '/' . str_pad ( floor ( $iNPIID / 1000 ) % 1000 , 3 , '0' , STR_PAD_LEFT );
$sImportFile .= '/' . str_pad ( $iNPIID % 1000 , 3 , '0' , STR_PAD_LEFT );
$sImportFile .= " .npi " ;
while ( ! file_exists ( $sImportFile ) && ! file_exists ( $sImportFile . '.bz2' ))
{
2011-04-27 16:14:33 +04:00
echo " sleep (waiting for $sImportFile ) \n " ;
2011-03-18 15:36:17 +03:00
sleep ( 10 );
}
if ( file_exists ( $sImportFile . '.bz2' )) $sImportFile .= '.bz2' ;
$iFileSize = filesize ( $sImportFile );
// Import the file
$fCMDStartTime = time ();
$sCMDImport = $sCMDImportTemplate . $sImportFile ;
echo $sCMDImport . " \n " ;
exec ( $sCMDImport , $sJunk , $iErrorLevel );
if ( $iErrorLevel )
{
2015-12-07 16:08:02 +03:00
fail ( " Error: $iErrorLevel\n " );
2011-03-18 15:36:17 +03:00
}
$sBatchEnd = $iNPIID ;
echo " Completed for $sBatchEnd in " . round (( time () - $fCMDStartTime ) / 60 , 2 ) . " minutes \n " ;
$sSQL = " INSERT INTO import_npi_log values ( $iNPIID , null, $iFileSize ,' " . date ( 'Y-m-d H:i:s' , $fCMDStartTime ) . " ',' " . date ( 'Y-m-d H:i:s' ) . " ','import') " ;
var_Dump ( $sSQL );
$oDB -> query ( $sSQL );
}
}
function getosmosistimestamp ( $sOsmosisConfigDirectory )
{
$sStateFile = file_get_contents ( $sOsmosisConfigDirectory . '/state.txt' );
preg_match ( '#timestamp=(.+)#' , $sStateFile , $aResult );
return str_replace ( '\:' , ':' , $aResult [ 1 ]);
}