1 # SPDX-License-Identifier: GPL-3.0-or-later
3 # This file is part of Nominatim. (https://nominatim.org)
5 # Copyright (C) 2025 by the Nominatim developer community.
6 # For a full list of authors see the git log.
8 Complex datatypes used by the Nominatim API.
10 from typing import Optional, Union, Tuple, NamedTuple, TypeVar, Type, Dict, \
12 from collections import abc
17 from struct import unpack
18 from binascii import unhexlify
20 from .errors import UsageError
23 @dataclasses.dataclass
25 """ Reference a place by Nominatim's internal ID.
27 A PlaceID may reference place from the main table placex, from
28 the interpolation tables or the postcode tables. Place IDs are not
29 stable between installations. You may use this type theefore only
30 with place IDs obtained from the same database.
34 The internal ID of the place to reference.
38 @dataclasses.dataclass
40 """ Reference a place by its OSM ID and potentially the basic category.
42 The OSM ID may refer to places in the main table placex and OSM
46 """ OSM type of the object. Must be one of `N`(node), `W`(way) or
50 """ The OSM ID of the object.
52 osm_class: Optional[str] = None
53 """ The same OSM object may appear multiple times in the database under
54 different categories. The optional class parameter allows to distinguish
55 the different categories and corresponds to the key part of the category.
56 If there are multiple objects in the database and `osm_class` is
57 left out, then one of the objects is returned at random.
60 def __post_init__(self) -> None:
61 if self.osm_type not in ('N', 'W', 'R'):
62 raise ValueError(f"Illegal OSM type '{self.osm_type}'. Must be one of N, W, R.")
64 def class_as_housenumber(self) -> Optional[int]:
65 """ Interpret the class property as a housenumber and return it.
67 If the OSM ID points to an interpolation, then the class may be
68 a number pointing to the exact number requested. This function
69 returns the housenumber as an int, if class is set and is a number.
71 if self.osm_class and self.osm_class.isdigit():
72 return int(self.osm_class)
76 PlaceRef = Union[PlaceID, OsmID]
79 class Point(NamedTuple):
80 """ A geographic point in WGS84 projection.
86 def lat(self) -> float:
87 """ Return the latitude of the point.
92 def lon(self) -> float:
93 """ Return the longitude of the point.
97 def to_geojson(self) -> str:
98 """ Return the point in GeoJSON format.
100 return f'{{"type": "Point","coordinates": [{self.x}, {self.y}]}}'
103 def from_wkb(wkb: Union[str, bytes]) -> 'Point':
104 """ Create a point from EWKB as returned from the database.
106 if isinstance(wkb, str):
109 raise ValueError(f"Point wkb has unexpected length {len(wkb)}")
111 gtype, srid, x, y = unpack('>iidd', wkb[1:])
113 gtype, srid, x, y = unpack('<iidd', wkb[1:])
115 raise ValueError("WKB has unknown endian value.")
117 if gtype != 0x20000001:
118 raise ValueError("WKB must be a point geometry.")
120 raise ValueError("Only WGS84 WKB supported.")
125 def from_param(inp: Any) -> 'Point':
126 """ Create a point from an input parameter. The parameter
127 may be given as a point, a string or a sequence of
128 strings or floats. Raises a UsageError if the format is
131 if isinstance(inp, Point):
135 if isinstance(inp, str):
137 elif isinstance(inp, abc.Sequence):
141 raise UsageError('Point parameter needs 2 coordinates.')
143 x, y = filter(math.isfinite, map(float, seq))
144 except ValueError as exc:
145 raise UsageError('Point parameter needs to be numbers.') from exc
147 if not -180 <= x <= 180 or not -90 <= y <= 90.0:
148 raise UsageError('Point coordinates invalid.')
152 def to_wkt(self) -> str:
153 """ Return the WKT representation of the point.
155 return f'POINT({self.x} {self.y})'
158 AnyPoint = Union[Point, Tuple[float, float]]
160 WKB_BBOX_HEADER_LE = b'\x01\x03\x00\x00\x20\xE6\x10\x00\x00\x01\x00\x00\x00\x05\x00\x00\x00'
161 WKB_BBOX_HEADER_BE = b'\x00\x20\x00\x00\x03\x00\x00\x10\xe6\x00\x00\x00\x01\x00\x00\x00\x05'
165 """ A bounding box in WGS84 projection.
167 The coordinates are available as an array in the 'coord'
168 property in the order (minx, miny, maxx, maxy).
170 def __init__(self, minx: float, miny: float, maxx: float, maxy: float) -> None:
171 """ Create a new bounding box with the given coordinates in WGS84
174 self.coords = (minx, miny, maxx, maxy)
177 def minlat(self) -> float:
178 """ Southern-most latitude, corresponding to the minimum y coordinate.
180 return self.coords[1]
183 def maxlat(self) -> float:
184 """ Northern-most latitude, corresponding to the maximum y coordinate.
186 return self.coords[3]
189 def minlon(self) -> float:
190 """ Western-most longitude, corresponding to the minimum x coordinate.
192 return self.coords[0]
195 def maxlon(self) -> float:
196 """ Eastern-most longitude, corresponding to the maximum x coordinate.
198 return self.coords[2]
201 def area(self) -> float:
202 """ Return the area of the box in WGS84.
204 return (self.coords[2] - self.coords[0]) * (self.coords[3] - self.coords[1])
206 def contains(self, pt: Point) -> bool:
207 """ Check if the point is inside or on the boundary of the box.
209 return self.coords[0] <= pt[0] and self.coords[1] <= pt[1]\
210 and self.coords[2] >= pt[0] and self.coords[3] >= pt[1]
212 def to_wkt(self) -> str:
213 """ Return the WKT representation of the Bbox. This
214 is a simple polygon with four points.
216 return 'POLYGON(({0} {1},{0} {3},{2} {3},{2} {1},{0} {1}))'\
217 .format(*self.coords)
220 def from_wkb(wkb: Union[None, str, bytes]) -> 'Optional[Bbox]':
221 """ Create a Bbox from a bounding box polygon as returned by
222 the database. Returns `None` if the input value is None.
227 if isinstance(wkb, str):
231 raise ValueError("WKB must be a bounding box polygon")
232 if wkb.startswith(WKB_BBOX_HEADER_LE):
233 x1, y1, _, _, x2, y2 = unpack('<dddddd', wkb[17:65])
234 elif wkb.startswith(WKB_BBOX_HEADER_BE):
235 x1, y1, _, _, x2, y2 = unpack('>dddddd', wkb[17:65])
237 raise ValueError("WKB has wrong header")
239 return Bbox(min(x1, x2), min(y1, y2), max(x1, x2), max(y1, y2))
242 def from_point(pt: Point, buffer: float) -> 'Bbox':
243 """ Return a Bbox around the point with the buffer added to all sides.
245 return Bbox(pt[0] - buffer, pt[1] - buffer,
246 pt[0] + buffer, pt[1] + buffer)
249 def from_param(inp: Any) -> 'Bbox':
250 """ Return a Bbox from an input parameter. The box may be
251 given as a Bbox, a string or a list or strings or integer.
252 Raises a UsageError if the format is incorrect.
254 if isinstance(inp, Bbox):
258 if isinstance(inp, str):
260 elif isinstance(inp, abc.Sequence):
264 raise UsageError('Bounding box parameter needs 4 coordinates.')
266 x1, y1, x2, y2 = filter(math.isfinite, map(float, seq))
267 except ValueError as exc:
268 raise UsageError('Bounding box parameter needs to be numbers.') from exc
270 x1 = min(180, max(-180, x1))
271 x2 = min(180, max(-180, x2))
272 y1 = min(90, max(-90, y1))
273 y2 = min(90, max(-90, y2))
275 if x1 == x2 or y1 == y2:
276 raise UsageError('Bounding box with invalid parameters.')
278 return Bbox(min(x1, x2), min(y1, y2), max(x1, x2), max(y1, y2))
281 class GeometryFormat(enum.Flag):
282 """ All search functions support returning the full geometry of a place in
283 various formats. The internal geometry is converted by PostGIS to
284 the desired format and then returned as a string. It is possible to
285 request multiple formats at the same time.
288 """ No geometry requested. Alias for a empty flag.
290 GEOJSON = enum.auto()
292 [GeoJSON](https://geojson.org/) format
296 [KML](https://en.wikipedia.org/wiki/Keyhole_Markup_Language) format
300 [SVG](http://www.w3.org/TR/SVG/paths.html) format
304 [WKT](https://en.wikipedia.org/wiki/Well-known_text_representation_of_geometry) format
308 class DataLayer(enum.Flag):
309 """ The `DataLayer` flag type defines the layers that can be selected
310 for reverse and forward search.
312 ADDRESS = enum.auto()
313 """ The address layer contains all places relevant for addresses:
314 fully qualified addresses with a house number (or a house name equivalent,
315 for some addresses) and places that can be part of an address like
316 roads, cities, states.
319 """ Layer for points of interest like shops, restaurants but also
320 recycling bins or postboxes.
322 RAILWAY = enum.auto()
323 """ Layer with railway features including tracks and other infrastructure.
324 Note that in Nominatim's standard configuration, only very few railway
325 features are imported into the database. Thus a custom configuration
326 is required to make full use of this layer.
328 NATURAL = enum.auto()
329 """ Layer with natural features like rivers, lakes and mountains.
331 MANMADE = enum.auto()
332 """ Layer with other human-made features and boundaries. This layer is
333 the catch-all and includes all features not covered by the other
334 layers. A typical example for this layer are national park boundaries.
338 class QueryStatistics(dict[str, Any]):
339 """ A specialised dictionary for collecting query statistics.
342 def __enter__(self) -> 'QueryStatistics':
343 self.log_time('start')
346 def __exit__(self, *_: Any) -> None:
348 self['total_time'] = (self['end'] - self['start']).total_seconds()
349 if 'start_query' in self:
350 self['wait_time'] = (self['start_query'] - self['start']).total_seconds()
352 self['wait_time'] = self['total_time']
353 self['start_query'] = self['end']
354 self['query_time'] = self['total_time'] - self['wait_time']
356 def __missing__(self, key: str) -> str:
359 def log_time(self, key: str) -> None:
360 self[key] = dt.datetime.now(tz=dt.timezone.utc)
364 """ Null object to use, when no query statistics are requested.
367 def __enter__(self) -> 'NoQueryStats':
370 def __exit__(self, *_: Any) -> None:
373 def __setitem__(self, key: str, value: Any) -> None:
376 def log_time(self, key: str) -> None:
380 def format_country(cc: Any) -> List[str]:
381 """ Extract a list of country codes from the input which may be either
382 a string or list of strings. Filters out all values that are not
386 if isinstance(cc, str):
387 clist = cc.split(',')
388 elif isinstance(cc, abc.Sequence):
391 raise UsageError("Parameter 'country' needs to be a comma-separated list "
392 "or a Python list of strings.")
394 return [cc.lower() for cc in clist if isinstance(cc, str) and len(cc) == 2]
397 def format_excluded(ids: Any) -> List[int]:
398 """ Extract a list of place ids from the input which may be either
399 a string or a list of strings or ints. Ignores empty value but
400 throws a UserError on anything that cannot be converted to int.
403 if isinstance(ids, str):
404 plist = [s.strip() for s in ids.split(',')]
405 elif isinstance(ids, abc.Sequence):
408 raise UsageError("Parameter 'excluded' needs to be a comma-separated list "
409 "or a Python list of numbers.")
410 if not all(isinstance(i, int) or
411 (isinstance(i, str) and (not i or i.isdigit())) for i in plist):
412 raise UsageError("Parameter 'excluded' only takes place IDs.")
414 return [int(id) for id in plist if id] or [0]
417 def format_categories(categories: List[Tuple[str, str]]) -> List[Tuple[str, str]]:
418 """ Extract a list of categories. Currently a noop.
423 TParam = TypeVar('TParam', bound='LookupDetails')
426 @dataclasses.dataclass
428 """ Collection of parameters that define which kind of details are
429 returned with a lookup or details result.
431 geometry_output: GeometryFormat = GeometryFormat.NONE
432 """ Add the full geometry of the place to the result. Multiple
433 formats may be selected. Note that geometries can become quite large.
435 address_details: bool = False
436 """ Get detailed information on the places that make up the address
439 linked_places: bool = False
440 """ Get detailed information on the places that link to the result.
442 parented_places: bool = False
443 """ Get detailed information on all places that this place is a parent
444 for, i.e. all places for which it provides the address details.
445 Only POI places can have parents.
447 entrances: bool = False
448 """ Get detailed information about the tagged entrances for the result.
450 keywords: bool = False
451 """ Add information about the search terms used for this place.
453 geometry_simplification: float = 0.0
454 """ Simplification factor for a geometry in degrees WGS. A factor of
455 0.0 means the original geometry is kept. The higher the value, the
456 more the geometry gets simplified.
458 query_stats: Union[QueryStatistics, NoQueryStats] = \
459 dataclasses.field(default_factory=NoQueryStats)
460 """ Optional QueryStatistics object collecting information about
461 runtime behaviour of the call.
465 def from_kwargs(cls: Type[TParam], kwargs: Dict[str, Any]) -> TParam:
466 """ Load the data fields of the class from a dictionary.
467 Unknown entries in the dictionary are ignored, missing ones
468 get the default setting.
470 The function supports type checking and throws a UsageError
471 when the value does not fit.
473 def _check_field(v: Any, field: 'dataclasses.Field[Any]') -> Any:
475 return field.default_factory() \
476 if field.default_factory != dataclasses.MISSING \
478 if field.metadata and 'transform' in field.metadata:
479 return field.metadata['transform'](v)
480 if not isinstance(v, field.type): # type: ignore[arg-type]
481 raise UsageError(f"Parameter '{field.name}' needs to be of {field.type!s}.")
484 return cls(**{f.name: _check_field(kwargs[f.name], f)
485 for f in dataclasses.fields(cls) if f.name in kwargs})
488 @dataclasses.dataclass
489 class ReverseDetails(LookupDetails):
490 """ Collection of parameters for the reverse call.
493 max_rank: int = dataclasses.field(default=30,
494 metadata={'transform': lambda v: max(0, min(v, 30))})
495 """ Highest address rank to return.
498 layers: DataLayer = DataLayer.ADDRESS | DataLayer.POI
499 """ Filter which kind of data to include.
503 @dataclasses.dataclass
504 class SearchDetails(LookupDetails):
505 """ Collection of parameters for the search call.
507 max_results: int = 10
508 """ Maximum number of results to be returned. The actual number of results
512 min_rank: int = dataclasses.field(default=0,
513 metadata={'transform': lambda v: max(0, min(v, 30))})
514 """ Lowest address rank to return.
517 max_rank: int = dataclasses.field(default=30,
518 metadata={'transform': lambda v: max(0, min(v, 30))})
519 """ Highest address rank to return.
522 layers: Optional[DataLayer] = dataclasses.field(default=None,
523 metadata={'transform': lambda r: r})
524 """ Filter which kind of data to include. When 'None' (the default) then
525 filtering by layers is disabled.
528 countries: List[str] = dataclasses.field(default_factory=list,
529 metadata={'transform': format_country})
530 """ Restrict search results to the given countries. An empty list (the
531 default) will disable this filter.
534 excluded: List[int] = dataclasses.field(default_factory=list,
535 metadata={'transform': format_excluded})
536 """ List of OSM objects to exclude from the results. Currently only
537 works when the internal place ID is given.
538 An empty list (the default) will disable this filter.
541 viewbox: Optional[Bbox] = dataclasses.field(default=None,
542 metadata={'transform': Bbox.from_param})
543 """ Focus the search on a given map area.
546 bounded_viewbox: bool = False
547 """ Use 'viewbox' as a filter and restrict results to places within the
551 near: Optional[Point] = dataclasses.field(default=None,
552 metadata={'transform': Point.from_param})
553 """ Order results by distance to the given point.
556 near_radius: Optional[float] = dataclasses.field(default=None,
557 metadata={'transform': lambda r: r})
558 """ Use near point as a filter and drop results outside the given
559 radius. Radius is given in degrees WSG84.
562 categories: List[Tuple[str, str]] = dataclasses.field(default_factory=list,
563 metadata={'transform': format_categories})
564 """ Restrict search to places with one of the given class/type categories.
565 An empty list (the default) will disable this filter.
568 viewbox_x2: Optional[Bbox] = None
570 def __post_init__(self) -> None:
571 if self.viewbox is not None:
572 xext = (self.viewbox.maxlon - self.viewbox.minlon)/2
573 yext = (self.viewbox.maxlat - self.viewbox.minlat)/2
574 self.viewbox_x2 = Bbox(self.viewbox.minlon - xext, self.viewbox.minlat - yext,
575 self.viewbox.maxlon + xext, self.viewbox.maxlat + yext)
577 def restrict_min_max_rank(self, new_min: int, new_max: int) -> None:
578 """ Change the min_rank and max_rank fields to respect the
581 assert new_min <= new_max
582 self.min_rank = max(self.min_rank, new_min)
583 self.max_rank = min(self.max_rank, new_max)
585 def is_impossible(self) -> bool:
586 """ Check if the parameter configuration is contradictionary and
587 cannot yield any results.
589 return (self.min_rank > self.max_rank
590 or (self.bounded_viewbox
591 and self.viewbox is not None and self.near is not None
592 and self.viewbox.contains(self.near))
593 or (self.layers is not None and not self.layers)
594 or (self.max_rank <= 4 and
595 self.layers is not None and not self.layers & DataLayer.ADDRESS))
597 def layer_enabled(self, layer: DataLayer) -> bool:
598 """ Check if the given layer has been chosen. Also returns
599 true when layer restriction has been disabled completely.
601 return self.layers is None or bool(self.layers & layer)
604 @dataclasses.dataclass
605 class EntranceDetails:
606 """ Reference a place by its OSM ID and potentially the basic category.
608 The OSM ID may refer to places in the main table placex and OSM
612 """ The OSM ID of the object.
615 """ The value of the OSM entrance tag (i.e. yes, main, secondary, etc.).
618 """ The location of the entrance node.
620 extratags: Dict[str, str]
621 """ The other tags associated with the entrance node.