oDB =& $oDB; $this->oPlaceLookup = new PlaceLookup($this->oDB); $this->oNormalizer = \Transliterator::createFromRules(CONST_Term_Normalization_Rules); } private function normTerm($sTerm) { if ($this->oNormalizer === null) { return $sTerm; } return $this->oNormalizer->transliterate($sTerm); } public function setReverseInPlan($bReverse) { $this->bReverseInPlan = $bReverse; } public function setLanguagePreference($aLangPref) { $this->aLangPrefOrder = $aLangPref; } public function getMoreUrlParams() { if ($this->aStructuredQuery) { $aParams = $this->aStructuredQuery; } else { $aParams = array('q' => $this->sQuery); } $aParams = array_merge($aParams, $this->oPlaceLookup->getMoreUrlParams()); if ($this->aExcludePlaceIDs) { $aParams['exclude_place_ids'] = implode(',', $this->aExcludePlaceIDs); } if ($this->bBoundedSearch) $aParams['bounded'] = '1'; if ($this->aCountryCodes) { $aParams['countrycodes'] = implode(',', $this->aCountryCodes); } if ($this->aViewBox) { $aParams['viewbox'] = join(',', $this->aViewBox); } return $aParams; } public function setLimit($iLimit = 10) { if ($iLimit > 50) $iLimit = 50; if ($iLimit < 1) $iLimit = 1; $this->iFinalLimit = $iLimit; $this->iLimit = $iLimit + min($iLimit, 10); } public function setFeatureType($sFeatureType) { switch ($sFeatureType) { case 'country': $this->setRankRange(4, 4); break; case 'state': $this->setRankRange(8, 8); break; case 'city': $this->setRankRange(14, 16); break; case 'settlement': $this->setRankRange(8, 20); break; } } public function setRankRange($iMin, $iMax) { $this->iMinAddressRank = $iMin; $this->iMaxAddressRank = $iMax; } public function setViewbox($aViewbox) { $aBox = array_map('floatval', $aViewbox); $this->aViewBox[0] = max(-180.0, min($aBox[0], $aBox[2])); $this->aViewBox[1] = max(-90.0, min($aBox[1], $aBox[3])); $this->aViewBox[2] = min(180.0, max($aBox[0], $aBox[2])); $this->aViewBox[3] = min(90.0, max($aBox[1], $aBox[3])); if ($this->aViewBox[2] - $this->aViewBox[0] < 0.000000001 || $this->aViewBox[3] - $this->aViewBox[1] < 0.000000001 ) { userError("Bad parameter 'viewbox'. Not a box."); } } private function viewboxImportanceFactor($fX, $fY) { if (!$this->aViewBox) { return 1; } $fWidth = ($this->aViewBox[2] - $this->aViewBox[0])/2; $fHeight = ($this->aViewBox[3] - $this->aViewBox[1])/2; $fXDist = abs($fX - ($this->aViewBox[0] + $this->aViewBox[2])/2); $fYDist = abs($fY - ($this->aViewBox[1] + $this->aViewBox[3])/2); if ($fXDist <= $fWidth && $fYDist <= $fHeight) { return 1; } if ($fXDist <= $fWidth * 3 && $fYDist <= 3 * $fHeight) { return 0.5; } return 0.25; } public function setQuery($sQueryString) { $this->sQuery = $sQueryString; $this->aStructuredQuery = false; } public function getQueryString() { return $this->sQuery; } public function loadParamArray($oParams, $sForceGeometryType = null) { $this->bBoundedSearch = $oParams->getBool('bounded', $this->bBoundedSearch); $this->setLimit($oParams->getInt('limit', $this->iFinalLimit)); $this->iOffset = $oParams->getInt('offset', $this->iOffset); $this->bFallback = $oParams->getBool('fallback', $this->bFallback); // List of excluded Place IDs - used for more acurate pageing $sExcluded = $oParams->getStringList('exclude_place_ids'); if ($sExcluded) { foreach ($sExcluded as $iExcludedPlaceID) { $iExcludedPlaceID = (int)$iExcludedPlaceID; if ($iExcludedPlaceID) $aExcludePlaceIDs[$iExcludedPlaceID] = $iExcludedPlaceID; } if (isset($aExcludePlaceIDs)) $this->aExcludePlaceIDs = $aExcludePlaceIDs; } // Only certain ranks of feature $sFeatureType = $oParams->getString('featureType'); if (!$sFeatureType) $sFeatureType = $oParams->getString('featuretype'); if ($sFeatureType) $this->setFeatureType($sFeatureType); // Country code list $sCountries = $oParams->getStringList('countrycodes'); if ($sCountries) { foreach ($sCountries as $sCountryCode) { if (preg_match('/^[a-zA-Z][a-zA-Z]$/', $sCountryCode)) { $aCountries[] = strtolower($sCountryCode); } } if (isset($aCountries)) $this->aCountryCodes = $aCountries; } $aViewbox = $oParams->getStringList('viewboxlbrt'); if ($aViewbox) { if (count($aViewbox) != 4) { userError("Bad parameter 'viewboxlbrt'. Expected 4 coordinates."); } $this->setViewbox($aViewbox); } else { $aViewbox = $oParams->getStringList('viewbox'); if ($aViewbox) { if (count($aViewbox) != 4) { userError("Bad parameter 'viewbox'. Expected 4 coordinates."); } $this->setViewBox($aViewbox); } else { $aRoute = $oParams->getStringList('route'); $fRouteWidth = $oParams->getFloat('routewidth'); if ($aRoute && $fRouteWidth) { $this->aRoutePoints = $aRoute; $this->aRouteWidth = $fRouteWidth; } } } $this->oPlaceLookup->loadParamArray($oParams, $sForceGeometryType); $this->oPlaceLookup->setIncludePolygonAsPoints($oParams->getBool('polygon')); $this->oPlaceLookup->setIncludeAddressDetails($oParams->getBool('addressdetails', false)); } public function setQueryFromParams($oParams) { // Search query $sQuery = $oParams->getString('q'); if (!$sQuery) { $this->setStructuredQuery( $oParams->getString('amenity'), $oParams->getString('street'), $oParams->getString('city'), $oParams->getString('county'), $oParams->getString('state'), $oParams->getString('country'), $oParams->getString('postalcode') ); $this->setReverseInPlan(false); } else { $this->setQuery($sQuery); } } public function loadStructuredAddressElement($sValue, $sKey, $iNewMinAddressRank, $iNewMaxAddressRank, $aItemListValues) { $sValue = trim($sValue); if (!$sValue) return false; $this->aStructuredQuery[$sKey] = $sValue; if ($this->iMinAddressRank == 0 && $this->iMaxAddressRank == 30) { $this->iMinAddressRank = $iNewMinAddressRank; $this->iMaxAddressRank = $iNewMaxAddressRank; } if ($aItemListValues) $this->aAddressRankList = array_merge($this->aAddressRankList, $aItemListValues); return true; } public function setStructuredQuery($sAmenity = false, $sStreet = false, $sCity = false, $sCounty = false, $sState = false, $sCountry = false, $sPostalCode = false) { $this->sQuery = false; // Reset $this->iMinAddressRank = 0; $this->iMaxAddressRank = 30; $this->aAddressRankList = array(); $this->aStructuredQuery = array(); $this->sAllowedTypesSQLList = false; $this->loadStructuredAddressElement($sAmenity, 'amenity', 26, 30, false); $this->loadStructuredAddressElement($sStreet, 'street', 26, 30, false); $this->loadStructuredAddressElement($sCity, 'city', 14, 24, false); $this->loadStructuredAddressElement($sCounty, 'county', 9, 13, false); $this->loadStructuredAddressElement($sState, 'state', 8, 8, false); $this->loadStructuredAddressElement($sPostalCode, 'postalcode', 5, 11, array(5, 11)); $this->loadStructuredAddressElement($sCountry, 'country', 4, 4, false); if (!empty($this->aStructuredQuery)) { $this->sQuery = join(', ', $this->aStructuredQuery); if ($this->iMaxAddressRank < 30) { $this->sAllowedTypesSQLList = '(\'place\',\'boundary\')'; } } } public function fallbackStructuredQuery() { if (!$this->aStructuredQuery) return false; $aParams = $this->aStructuredQuery; if (count($aParams) == 1) return false; $aOrderToFallback = array('postalcode', 'street', 'city', 'county', 'state'); foreach ($aOrderToFallback as $sType) { if (isset($aParams[$sType])) { unset($aParams[$sType]); $this->setStructuredQuery(@$aParams['amenity'], @$aParams['street'], @$aParams['city'], @$aParams['county'], @$aParams['state'], @$aParams['country'], @$aParams['postalcode']); return true; } } return false; } public function getGroupedSearches($aSearches, $aPhrases, $oValidTokens, $bIsStructured) { /* Calculate all searches using oValidTokens i.e. 'Wodsworth Road, Sheffield' => Phrase Wordset 0 0 (wodsworth road) 0 1 (wodsworth)(road) 1 0 (sheffield) Score how good the search is so they can be ordered */ foreach ($aPhrases as $iPhrase => $oPhrase) { $aNewPhraseSearches = array(); $sPhraseType = $bIsStructured ? $oPhrase->getPhraseType() : ''; foreach ($oPhrase->getWordSets() as $iWordSet => $aWordset) { // Too many permutations - too expensive if ($iWordSet > 120) break; $aWordsetSearches = $aSearches; // Add all words from this wordset foreach ($aWordset as $iToken => $sToken) { //echo "
$sToken"; $aNewWordsetSearches = array(); foreach ($aWordsetSearches as $oCurrentSearch) { //echo ""; //var_dump($oCurrentSearch); //echo ""; // Tokens with full name matches. foreach ($oValidTokens->get(' '.$sToken) as $oSearchTerm) { $aNewSearches = $oCurrentSearch->extendWithFullTerm( $oSearchTerm, $oValidTokens->contains($sToken) && strpos($sToken, ' ') === false, $sPhraseType, $iToken == 0 && $iPhrase == 0, $iPhrase == 0, $iToken + 1 == count($aWordset) && $iPhrase + 1 == count($aPhrases) ); foreach ($aNewSearches as $oSearch) { if ($oSearch->getRank() < $this->iMaxRank) { $aNewWordsetSearches[] = $oSearch; } } } // Look for partial matches. // Note that there is no point in adding country terms here // because country is omitted in the address. if ($sPhraseType != 'country') { // Allow searching for a word - but at extra cost foreach ($oValidTokens->get($sToken) as $oSearchTerm) { $aNewSearches = $oCurrentSearch->extendWithPartialTerm( $sToken, $oSearchTerm, $bIsStructured, $iPhrase, $oValidTokens->get(' '.$sToken) ); foreach ($aNewSearches as $oSearch) { if ($oSearch->getRank() < $this->iMaxRank) { $aNewWordsetSearches[] = $oSearch; } } } } } // Sort and cut usort($aNewWordsetSearches, array('Nominatim\SearchDescription', 'bySearchRank')); $aWordsetSearches = array_slice($aNewWordsetSearches, 0, 50); } //var_Dump('
',count($aWordsetSearches)); exit; $aNewPhraseSearches = array_merge($aNewPhraseSearches, $aNewWordsetSearches); usort($aNewPhraseSearches, array('Nominatim\SearchDescription', 'bySearchRank')); $aSearchHash = array(); foreach ($aNewPhraseSearches as $iSearch => $aSearch) { $sHash = serialize($aSearch); if (isset($aSearchHash[$sHash])) unset($aNewPhraseSearches[$iSearch]); else $aSearchHash[$sHash] = 1; } $aNewPhraseSearches = array_slice($aNewPhraseSearches, 0, 50); } // Re-group the searches by their score, junk anything over 20 as just not worth trying $aGroupedSearches = array(); foreach ($aNewPhraseSearches as $aSearch) { $iRank = $aSearch->getRank(); if ($iRank < $this->iMaxRank) { if (!isset($aGroupedSearches[$iRank])) { $aGroupedSearches[$iRank] = array(); } $aGroupedSearches[$iRank][] = $aSearch; } } ksort($aGroupedSearches); $iSearchCount = 0; $aSearches = array(); foreach ($aGroupedSearches as $iScore => $aNewSearches) { $iSearchCount += count($aNewSearches); $aSearches = array_merge($aSearches, $aNewSearches); if ($iSearchCount > 50) break; } } // Revisit searches, drop bad searches and give penalty to unlikely combinations. $aGroupedSearches = array(); foreach ($aSearches as $oSearch) { if (!$oSearch->isValidSearch()) { continue; } $iRank = $oSearch->getRank(); if (!isset($aGroupedSearches[$iRank])) { $aGroupedSearches[$iRank] = array(); } $aGroupedSearches[$iRank][] = $oSearch; } ksort($aGroupedSearches); return $aGroupedSearches; } /* Perform the actual query lookup. Returns an ordered list of results, each with the following fields: osm_type: type of corresponding OSM object N - node W - way R - relation P - postcode (internally computed) osm_id: id of corresponding OSM object class: general object class (corresponds to tag key of primary OSM tag) type: subclass of object (corresponds to tag value of primary OSM tag) admin_level: see https://wiki.openstreetmap.org/wiki/Admin_level rank_search: rank in search hierarchy (see also https://wiki.openstreetmap.org/wiki/Nominatim/Development_overview#Country_to_street_level) rank_address: rank in address hierarchy (determines orer in address) place_id: internal key (may differ between different instances) country_code: ISO country code langaddress: localized full address placename: localized name of object ref: content of ref tag (if available) lon: longitude lat: latitude importance: importance of place based on Wikipedia link count addressimportance: cumulated importance of address elements extra_place: type of place (for admin boundaries, if there is a place tag) aBoundingBox: bounding Box label: short description of the object class/type (English only) name: full name (currently the same as langaddress) foundorder: secondary ordering for places with same importance */ public function lookup() { Debug::newFunction('Geocode::lookup'); if (!$this->sQuery && !$this->aStructuredQuery) return array(); Debug::printDebugArray('Geocode', $this); $oCtx = new SearchContext(); if ($this->aRoutePoints) { $oCtx->setViewboxFromRoute( $this->oDB, $this->aRoutePoints, $this->aRouteWidth, $this->bBoundedSearch ); } elseif ($this->aViewBox) { $oCtx->setViewboxFromBox($this->aViewBox, $this->bBoundedSearch); } if ($this->aExcludePlaceIDs) { $oCtx->setExcludeList($this->aExcludePlaceIDs); } if ($this->aCountryCodes) { $oCtx->setCountryList($this->aCountryCodes); } Debug::newSection('Query Preprocessing'); $sNormQuery = $this->normTerm($this->sQuery); Debug::printVar('Normalized query', $sNormQuery); $sLanguagePrefArraySQL = getArraySQL( array_map('getDBQuoted', $this->aLangPrefOrder) ); $sQuery = $this->sQuery; if (!preg_match('//u', $sQuery)) { userError('Query string is not UTF-8 encoded.'); } // Conflicts between US state abreviations and various words for 'the' in different languages if (isset($this->aLangPrefOrder['name:en'])) { $sQuery = preg_replace('/(^|,)\s*il\s*(,|$)/i', '\1illinois\2', $sQuery); $sQuery = preg_replace('/(^|,)\s*al\s*(,|$)/i', '\1alabama\2', $sQuery); $sQuery = preg_replace('/(^|,)\s*la\s*(,|$)/i', '\1louisiana\2', $sQuery); } // Do we have anything that looks like a lat/lon pair? $sQuery = $oCtx->setNearPointFromQuery($sQuery); $aResults = array(); if ($sQuery || $this->aStructuredQuery) { // Start with a single blank search $aSearches = array(new SearchDescription($oCtx)); if ($sQuery) { $sQuery = $aSearches[0]->extractKeyValuePairs($sQuery); } $sSpecialTerm = ''; if ($sQuery) { preg_match_all( '/\\[([\\w ]*)\\]/u', $sQuery, $aSpecialTermsRaw, PREG_SET_ORDER ); if (!empty($aSpecialTermsRaw)) { Debug::printVar('Special terms', $aSpecialTermsRaw); } foreach ($aSpecialTermsRaw as $aSpecialTerm) { $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery); if (!$sSpecialTerm) { $sSpecialTerm = $aSpecialTerm[1]; } } } if (!$sSpecialTerm && $this->aStructuredQuery && isset($this->aStructuredQuery['amenity'])) { $sSpecialTerm = $this->aStructuredQuery['amenity']; unset($this->aStructuredQuery['amenity']); } if ($sSpecialTerm && !$aSearches[0]->hasOperator()) { $sSpecialTerm = pg_escape_string($sSpecialTerm); $sToken = chksql( $this->oDB->getOne("SELECT make_standard_name('$sSpecialTerm')"), 'Cannot decode query. Wrong encoding?' ); $sSQL = 'SELECT class, type FROM word '; $sSQL .= ' WHERE word_token in (\' '.$sToken.'\')'; $sSQL .= ' AND class is not null AND class not in (\'place\')'; Debug::printSQL($sSQL); $aSearchWords = chksql($this->oDB->getAll($sSQL)); $aNewSearches = array(); foreach ($aSearches as $oSearch) { foreach ($aSearchWords as $aSearchTerm) { $oNewSearch = clone $oSearch; $oNewSearch->setPoiSearch( Operator::TYPE, $aSearchTerm['class'], $aSearchTerm['type'] ); $aNewSearches[] = $oNewSearch; } } $aSearches = $aNewSearches; } // Split query into phrases // Commas are used to reduce the search space by indicating where phrases split if ($this->aStructuredQuery) { $aInPhrases = $this->aStructuredQuery; $bStructuredPhrases = true; } else { $aInPhrases = explode(',', $sQuery); $bStructuredPhrases = false; } Debug::printDebugArray('Search context', $oCtx); Debug::printDebugArray('Base search', empty($aSearches) ? null : $aSearches[0]); Debug::printVar('Final query phrases', $aInPhrases); // Convert each phrase to standard form // Create a list of standard words // Get all 'sets' of words // Generate a complete list of all Debug::newSection('Tokenization'); $aTokens = array(); $aPhrases = array(); foreach ($aInPhrases as $iPhrase => $sPhrase) { $sPhrase = chksql( $this->oDB->getOne('SELECT make_standard_name('.getDBQuoted($sPhrase).')'), 'Cannot normalize query string (is it a UTF-8 string?)' ); if (trim($sPhrase)) { $oPhrase = new Phrase($sPhrase, is_string($iPhrase) ? $iPhrase : ''); $oPhrase->addTokens($aTokens); $aPhrases[] = $oPhrase; } } Debug::printDebugTable('Phrases', $aPhrases); Debug::printVar('Tokens', $aTokens); $oValidTokens = new TokenList(); if (!empty($aTokens)) { $sSQL = 'SELECT word_id, word_token, word, class, type, country_code, operator, search_name_count'; $sSQL .= ' FROM word '; $sSQL .= ' WHERE word_token in ('.join(',', array_map('getDBQuoted', $aTokens)).')'; Debug::printSQL($sSQL); $oValidTokens->addTokensFromDB( $this->oDB, $aTokens, $this->aCountryCodes, $sNormQuery, $this->oNormalizer ); // Try more interpretations for Tokens that could not be matched. foreach ($aTokens as $sToken) { if ($sToken[0] == ' ' && !$oValidTokens->contains($sToken)) { if (preg_match('/^ ([0-9]{5}) [0-9]{4}$/', $sToken, $aData)) { // US ZIP+4 codes - merge in the 5-digit ZIP code $oValidTokens->addToken( $sToken, new Token\Postcode(null, $aData[1], 'us') ); } elseif (preg_match('/^ [0-9]+$/', $sToken)) { // Unknown single word token with a number. // Assume it is a house number. $oValidTokens->addToken( $sToken, new Token\HouseNumber(null, trim($sToken)) ); } } } // Any words that have failed completely? // TODO: suggestions Debug::printGroupTable('Valid Tokens', $oValidTokens->debugInfo()); Debug::newSection('Search candidates'); $aGroupedSearches = $this->getGroupedSearches($aSearches, $aPhrases, $oValidTokens, $bStructuredPhrases); if ($this->bReverseInPlan) { // Reverse phrase array and also reverse the order of the wordsets in // the first and final phrase. Don't bother about phrases in the middle // because order in the address doesn't matter. $aPhrases = array_reverse($aPhrases); $aPhrases[0]->invertWordSets(); if (count($aPhrases) > 1) { $aPhrases[count($aPhrases)-1]->invertWordSets(); } $aReverseGroupedSearches = $this->getGroupedSearches($aSearches, $aPhrases, $oValidTokens, false); foreach ($aGroupedSearches as $aSearches) { foreach ($aSearches as $aSearch) { if (!isset($aReverseGroupedSearches[$aSearch->getRank()])) { $aReverseGroupedSearches[$aSearch->getRank()] = array(); } $aReverseGroupedSearches[$aSearch->getRank()][] = $aSearch; } } $aGroupedSearches = $aReverseGroupedSearches; ksort($aGroupedSearches); } } else { // Re-group the searches by their score, junk anything over 20 as just not worth trying $aGroupedSearches = array(); foreach ($aSearches as $aSearch) { if ($aSearch->getRank() < $this->iMaxRank) { if (!isset($aGroupedSearches[$aSearch->getRank()])) $aGroupedSearches[$aSearch->getRank()] = array(); $aGroupedSearches[$aSearch->getRank()][] = $aSearch; } } ksort($aGroupedSearches); } // Filter out duplicate searches $aSearchHash = array(); foreach ($aGroupedSearches as $iGroup => $aSearches) { foreach ($aSearches as $iSearch => $aSearch) { $sHash = serialize($aSearch); if (isset($aSearchHash[$sHash])) { unset($aGroupedSearches[$iGroup][$iSearch]); if (empty($aGroupedSearches[$iGroup])) unset($aGroupedSearches[$iGroup]); } else { $aSearchHash[$sHash] = 1; } } } Debug::printGroupedSearch( $aGroupedSearches, $oValidTokens->debugTokenByWordIdList() ); // Start the search process $iGroupLoop = 0; $iQueryLoop = 0; foreach ($aGroupedSearches as $iGroupedRank => $aSearches) { $iGroupLoop++; foreach ($aSearches as $oSearch) { $iQueryLoop++; Debug::newSection("Search Loop, group $iGroupLoop, loop $iQueryLoop"); Debug::printGroupedSearch( array($iGroupedRank => array($oSearch)), $oValidTokens->debugTokenByWordIdList() ); $aResults += $oSearch->query( $this->oDB, $this->iMinAddressRank, $this->iMaxAddressRank, $this->iLimit ); if ($iQueryLoop > 20) break; } if (!empty($aResults) && ($this->iMinAddressRank != 0 || $this->iMaxAddressRank != 30)) { // Need to verify passes rank limits before dropping out of the loop (yuk!) // reduces the number of place ids, like a filter // rank_address is 30 for interpolated housenumbers $aFilterSql = array(); $sPlaceIds = Result::joinIdsByTable($aResults, Result::TABLE_PLACEX); if ($sPlaceIds) { $sSQL = 'SELECT place_id FROM placex '; $sSQL .= 'WHERE place_id in ('.$sPlaceIds.') '; $sSQL .= ' AND ('; $sSQL .= " placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank "; if (14 >= $this->iMinAddressRank && 14 <= $this->iMaxAddressRank) { $sSQL .= " OR (extratags->'place') = 'city'"; } if ($this->aAddressRankList) { $sSQL .= ' OR placex.rank_address in ('.join(',', $this->aAddressRankList).')'; } $sSQL .= ')'; $aFilterSql[] = $sSQL; } $sPlaceIds = Result::joinIdsByTable($aResults, Result::TABLE_POSTCODE); if ($sPlaceIds) { $sSQL = ' SELECT place_id FROM location_postcode lp '; $sSQL .= 'WHERE place_id in ('.$sPlaceIds.') '; $sSQL .= " AND (lp.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank "; if ($this->aAddressRankList) { $sSQL .= ' OR lp.rank_address in ('.join(',', $this->aAddressRankList).')'; } $sSQL .= ') '; $aFilterSql[] = $sSQL; } $aFilteredIDs = array(); if ($aFilterSql) { $sSQL = join(' UNION ', $aFilterSql); Debug::printSQL($sSQL); $aFilteredIDs = chksql($this->oDB->getCol($sSQL)); } $tempIDs = array(); foreach ($aResults as $oResult) { if (($this->iMaxAddressRank == 30 && ($oResult->iTable == Result::TABLE_OSMLINE || $oResult->iTable == Result::TABLE_AUX || $oResult->iTable == Result::TABLE_TIGER)) || in_array($oResult->iId, $aFilteredIDs) ) { $tempIDs[$oResult->iId] = $oResult; } } $aResults = $tempIDs; } if (!empty($aResults)) break; if ($iGroupLoop > 4) break; if ($iQueryLoop > 30) break; } } else { // Just interpret as a reverse geocode $oReverse = new ReverseGeocode($this->oDB); $oReverse->setZoom(18); $oLookup = $oReverse->lookupPoint($oCtx->sqlNear, false); Debug::printVar('Reverse search', $oLookup); if ($oLookup) { $aResults = array($oLookup->iId => $oLookup); } } // No results? Done if (empty($aResults)) { if ($this->bFallback) { if ($this->fallbackStructuredQuery()) { return $this->lookup(); } } return array(); } if ($this->aAddressRankList) { $this->oPlaceLookup->setAddressRankList($this->aAddressRankList); } $this->oPlaceLookup->setAllowedTypesSQLList($this->sAllowedTypesSQLList); $this->oPlaceLookup->setLanguagePreference($this->aLangPrefOrder); if ($oCtx->hasNearPoint()) { $this->oPlaceLookup->setAnchorSql($oCtx->sqlNear); } $aSearchResults = $this->oPlaceLookup->lookup($aResults); $aClassType = ClassTypes\getListWithImportance(); $aRecheckWords = preg_split('/\b[\s,\\-]*/u', $sQuery); foreach ($aRecheckWords as $i => $sWord) { if (!preg_match('/[\pL\pN]/', $sWord)) unset($aRecheckWords[$i]); } Debug::printVar('Recheck words', $aRecheckWords); foreach ($aSearchResults as $iIdx => $aResult) { // Default $fDiameter = ClassTypes\getProperty($aResult, 'defdiameter', 0.0001); $aOutlineResult = $this->oPlaceLookup->getOutlines($aResult['place_id'], $aResult['lon'], $aResult['lat'], $fDiameter/2); if ($aOutlineResult) { $aResult = array_merge($aResult, $aOutlineResult); } if ($aResult['extra_place'] == 'city') { $aResult['class'] = 'place'; $aResult['type'] = 'city'; $aResult['rank_search'] = 16; } // Is there an icon set for this type of result? $aClassInfo = ClassTypes\getInfo($aResult); if ($aClassInfo) { if (isset($aClassInfo['icon'])) { $aResult['icon'] = CONST_Website_BaseURL.'images/mapicons/'.$aClassInfo['icon'].'.p.20.png'; } if (isset($aClassInfo['label'])) { $aResult['label'] = $aClassInfo['label']; } } $aResult['name'] = $aResult['langaddress']; if ($oCtx->hasNearPoint()) { $aResult['importance'] = 0.001; $aResult['foundorder'] = $aResult['addressimportance']; } else { $aResult['importance'] = max(0.001, $aResult['importance']); $aResult['importance'] *= $this->viewboxImportanceFactor( $aResult['lon'], $aResult['lat'] ); // Adjust importance for the number of exact string matches in the result $iCountWords = 0; $sAddress = $aResult['langaddress']; foreach ($aRecheckWords as $i => $sWord) { if (stripos($sAddress, $sWord)!==false) { $iCountWords++; if (preg_match('/(^|,)\s*'.preg_quote($sWord, '/').'\s*(,|$)/', $sAddress)) $iCountWords += 0.1; } } $aResult['importance'] = $aResult['importance'] + ($iCountWords*0.1); // 0.1 is a completely arbitrary number but something in the range 0.1 to 0.5 would seem right // secondary ordering (for results with same importance (the smaller the better): // - approximate importance of address parts $aResult['foundorder'] = -$aResult['addressimportance']/10; // - number of exact matches from the query $aResult['foundorder'] -= $aResults[$aResult['place_id']]->iExactMatches; // - importance of the class/type if (isset($aClassType[$aResult['class'].':'.$aResult['type']]['importance']) && $aClassType[$aResult['class'].':'.$aResult['type']]['importance'] ) { $aResult['foundorder'] += 0.0001 * $aClassType[$aResult['class'].':'.$aResult['type']]['importance']; } else { $aResult['foundorder'] += 0.01; } } $aSearchResults[$iIdx] = $aResult; } uasort($aSearchResults, 'byImportance'); Debug::printVar('Pre-filter results', $aSearchResults); $aOSMIDDone = array(); $aClassTypeNameDone = array(); $aToFilter = $aSearchResults; $aSearchResults = array(); $bFirst = true; foreach ($aToFilter as $aResult) { $this->aExcludePlaceIDs[$aResult['place_id']] = $aResult['place_id']; if ($bFirst) { $fLat = $aResult['lat']; $fLon = $aResult['lon']; if (isset($aResult['zoom'])) $iZoom = $aResult['zoom']; $bFirst = false; } if (!$this->oPlaceLookup->doDeDupe() || (!isset($aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']]) && !isset($aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']])) ) { $aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']] = true; $aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']] = true; $aSearchResults[] = $aResult; } // Absolute limit on number of results if (count($aSearchResults) >= $this->iFinalLimit) break; } Debug::printVar('Post-filter results', $aSearchResults); return $aSearchResults; } // end lookup() public function debugInfo() { return array( 'Query' => $this->sQuery, 'Structured query' => $this->aStructuredQuery, 'Name keys' => Debug::fmtArrayVals($this->aLangPrefOrder), 'Excluded place IDs' => Debug::fmtArrayVals($this->aExcludePlaceIDs), 'Try reversed query'=> $this->bReverseInPlan, 'Limit (for searches)' => $this->iLimit, 'Limit (for results)'=> $this->iFinalLimit, 'Country codes' => Debug::fmtArrayVals($this->aCountryCodes), 'Bounded search' => $this->bBoundedSearch, 'Viewbox' => Debug::fmtArrayVals($this->aViewBox), 'Route points' => Debug::fmtArrayVals($this->aRoutePoints), 'Route width' => $this->aRouteWidth, 'Max rank' => $this->iMaxRank, 'Min address rank' => $this->iMinAddressRank, 'Max address rank' => $this->iMaxAddressRank, 'Address rank list' => Debug::fmtArrayVals($this->aAddressRankList) ); } } // end class