2018-05-15 00:04:15 +03:00
|
|
|
<?php
|
|
|
|
|
|
|
|
namespace Nominatim;
|
|
|
|
|
2020-12-15 12:09:55 +03:00
|
|
|
require_once(CONST_LibDir.'/TokenCountry.php');
|
|
|
|
require_once(CONST_LibDir.'/TokenHousenumber.php');
|
|
|
|
require_once(CONST_LibDir.'/TokenPostcode.php');
|
|
|
|
require_once(CONST_LibDir.'/TokenSpecialTerm.php');
|
|
|
|
require_once(CONST_LibDir.'/TokenWord.php');
|
2021-07-13 17:54:51 +03:00
|
|
|
require_once(CONST_LibDir.'/TokenPartial.php');
|
2020-12-15 12:09:55 +03:00
|
|
|
require_once(CONST_LibDir.'/SpecialSearchOperator.php');
|
2018-05-15 00:04:15 +03:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Saves information about the tokens that appear in a search query.
|
|
|
|
*
|
2018-05-15 00:17:54 +03:00
|
|
|
* Tokens are sorted by their normalized form, the token word. There are different
|
|
|
|
* kinds of tokens, represented by different Token* classes. Note that
|
|
|
|
* tokens do not have a common base class. All tokens need to have a field
|
|
|
|
* with the word id that points to an entry in the `word` database table
|
|
|
|
* but otherwise the information saved about a token can be very different.
|
2018-05-15 00:04:15 +03:00
|
|
|
*/
|
|
|
|
class TokenList
|
|
|
|
{
|
|
|
|
// List of list of tokens indexed by their word_token.
|
|
|
|
private $aTokens = array();
|
|
|
|
|
2018-07-19 03:31:54 +03:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Return total number of tokens.
|
|
|
|
*
|
|
|
|
* @return Integer
|
|
|
|
*/
|
|
|
|
public function count()
|
|
|
|
{
|
|
|
|
return count($this->aTokens);
|
|
|
|
}
|
|
|
|
|
2018-05-15 00:17:54 +03:00
|
|
|
/**
|
|
|
|
* Check if there are tokens for the given token word.
|
|
|
|
*
|
|
|
|
* @param string $sWord Token word to look for.
|
|
|
|
*
|
|
|
|
* @return bool True if there is one or more token for the token word.
|
|
|
|
*/
|
2018-05-15 00:04:15 +03:00
|
|
|
public function contains($sWord)
|
|
|
|
{
|
|
|
|
return isset($this->aTokens[$sWord]);
|
|
|
|
}
|
|
|
|
|
2019-06-29 19:22:31 +03:00
|
|
|
/**
|
|
|
|
* Check if there are partial or full tokens for the given word.
|
|
|
|
*
|
|
|
|
* @param string $sWord Token word to look for.
|
|
|
|
*
|
|
|
|
* @return bool True if there is one or more token for the token word.
|
|
|
|
*/
|
|
|
|
public function containsAny($sWord)
|
|
|
|
{
|
2021-07-14 23:17:17 +03:00
|
|
|
return isset($this->aTokens[$sWord]);
|
2019-06-29 19:22:31 +03:00
|
|
|
}
|
|
|
|
|
2018-05-15 00:17:54 +03:00
|
|
|
/**
|
|
|
|
* Get the list of tokens for the given token word.
|
|
|
|
*
|
|
|
|
* @param string $sWord Token word to look for.
|
|
|
|
*
|
|
|
|
* @return object[] Array of tokens for the given token word or an
|
|
|
|
* empty array if no tokens could be found.
|
|
|
|
*/
|
2018-05-15 00:04:15 +03:00
|
|
|
public function get($sWord)
|
|
|
|
{
|
|
|
|
return isset($this->aTokens[$sWord]) ? $this->aTokens[$sWord] : array();
|
|
|
|
}
|
|
|
|
|
2020-11-25 13:44:25 +03:00
|
|
|
public function getFullWordIDs()
|
|
|
|
{
|
|
|
|
$ids = array();
|
|
|
|
|
2020-11-25 18:14:31 +03:00
|
|
|
foreach ($this->aTokens as $aTokenList) {
|
|
|
|
foreach ($aTokenList as $oToken) {
|
2021-07-14 23:17:17 +03:00
|
|
|
if (is_a($oToken, '\Nominatim\Token\Word')) {
|
2021-07-17 21:24:33 +03:00
|
|
|
$ids[$oToken->getId()] = $oToken->getId();
|
2020-11-25 13:44:25 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $ids;
|
|
|
|
}
|
|
|
|
|
2018-05-15 00:04:15 +03:00
|
|
|
/**
|
|
|
|
* Add a new token for the given word.
|
|
|
|
*
|
|
|
|
* @param string $sWord Word the token describes.
|
|
|
|
* @param object $oToken Token object to add.
|
|
|
|
*
|
|
|
|
* @return void
|
|
|
|
*/
|
|
|
|
public function addToken($sWord, $oToken)
|
|
|
|
{
|
|
|
|
if (isset($this->aTokens[$sWord])) {
|
|
|
|
$this->aTokens[$sWord][] = $oToken;
|
|
|
|
} else {
|
|
|
|
$this->aTokens[$sWord] = array($oToken);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public function debugTokenByWordIdList()
|
|
|
|
{
|
|
|
|
$aWordsIDs = array();
|
|
|
|
foreach ($this->aTokens as $sToken => $aWords) {
|
|
|
|
foreach ($aWords as $aToken) {
|
2021-07-17 21:24:33 +03:00
|
|
|
$iId = $aToken->getId();
|
|
|
|
if ($iId !== null) {
|
|
|
|
$aWordsIDs[$iId] = '#'.$sToken.'('.$aToken->debugCode().' '.$iId.')#';
|
2018-05-15 00:04:15 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $aWordsIDs;
|
|
|
|
}
|
|
|
|
|
|
|
|
public function debugInfo()
|
|
|
|
{
|
|
|
|
return $this->aTokens;
|
|
|
|
}
|
|
|
|
}
|