1 # SPDX-License-Identifier: GPL-3.0-or-later
3 # This file is part of Nominatim. (https://nominatim.org)
5 # Copyright (C) 2025 by the Nominatim developer community.
6 # For a full list of authors see the git log.
8 Complex datatypes used by the Nominatim API.
10 from typing import Optional, Union, Tuple, NamedTuple, TypeVar, Type, Dict, \
12 from collections import abc
17 from struct import unpack
18 from binascii import unhexlify
20 from .errors import UsageError
23 @dataclasses.dataclass
25 """ Reference a place by Nominatim's internal ID.
27 A PlaceID may reference place from the main table placex, from
28 the interpolation tables or the postcode tables. Place IDs are not
29 stable between installations. You may use this type theefore only
30 with place IDs obtained from the same database.
34 The internal ID of the place to reference.
38 @dataclasses.dataclass
40 """ Reference a place by its OSM ID and potentially the basic category.
42 The OSM ID may refer to places in the main table placex and OSM
46 """ OSM type of the object. Must be one of `N`(node), `W`(way) or
50 """ The OSM ID of the object.
52 osm_class: Optional[str] = None
53 """ The same OSM object may appear multiple times in the database under
54 different categories. The optional class parameter allows to distinguish
55 the different categories and corresponds to the key part of the category.
56 If there are multiple objects in the database and `osm_class` is
57 left out, then one of the objects is returned at random.
60 def __post_init__(self) -> None:
61 if self.osm_type not in ('N', 'W', 'R'):
62 raise ValueError(f"Illegal OSM type '{self.osm_type}'. Must be one of N, W, R.")
64 def class_as_housenumber(self) -> Optional[int]:
65 """ Interpret the class property as a housenumber and return it.
67 If the OSM ID points to an interpolation, then the class may be
68 a number pointing to the exact number requested. This function
69 returns the housenumber as an int, if class is set and is a number.
71 if self.osm_class and self.osm_class.isdigit():
72 return int(self.osm_class)
76 PlaceRef = Union[PlaceID, OsmID]
79 class Point(NamedTuple):
80 """ A geographic point in WGS84 projection.
86 def lat(self) -> float:
87 """ Return the latitude of the point.
92 def lon(self) -> float:
93 """ Return the longitude of the point.
97 def to_geojson(self) -> str:
98 """ Return the point in GeoJSON format.
100 return f'{{"type": "Point","coordinates": [{self.x}, {self.y}]}}'
103 def from_wkb(wkb: Union[str, bytes]) -> 'Point':
104 """ Create a point from EWKB as returned from the database.
106 if isinstance(wkb, str):
109 raise ValueError(f"Point wkb has unexpected length {len(wkb)}")
111 gtype, srid, x, y = unpack('>iidd', wkb[1:])
113 gtype, srid, x, y = unpack('<iidd', wkb[1:])
115 raise ValueError("WKB has unknown endian value.")
117 if gtype != 0x20000001:
118 raise ValueError("WKB must be a point geometry.")
120 raise ValueError("Only WGS84 WKB supported.")
125 def from_param(inp: Any) -> 'Point':
126 """ Create a point from an input parameter. The parameter
127 may be given as a point, a string or a sequence of
128 strings or floats. Raises a UsageError if the format is
131 if isinstance(inp, Point):
135 if isinstance(inp, str):
137 elif isinstance(inp, abc.Sequence):
141 raise UsageError('Point parameter needs 2 coordinates.')
143 x, y = filter(math.isfinite, map(float, seq))
144 except ValueError as exc:
145 raise UsageError('Point parameter needs to be numbers.') from exc
147 if not -180 <= x <= 180 or not -90 <= y <= 90.0:
148 raise UsageError('Point coordinates invalid.')
152 def to_wkt(self) -> str:
153 """ Return the WKT representation of the point.
155 return f'POINT({self.x} {self.y})'
158 AnyPoint = Union[Point, Tuple[float, float]]
160 WKB_BBOX_HEADER_LE = b'\x01\x03\x00\x00\x20\xE6\x10\x00\x00\x01\x00\x00\x00\x05\x00\x00\x00'
161 WKB_BBOX_HEADER_BE = b'\x00\x20\x00\x00\x03\x00\x00\x10\xe6\x00\x00\x00\x01\x00\x00\x00\x05'
165 """ A bounding box in WGS84 projection.
167 The coordinates are available as an array in the 'coord'
168 property in the order (minx, miny, maxx, maxy).
170 def __init__(self, minx: float, miny: float, maxx: float, maxy: float) -> None:
171 """ Create a new bounding box with the given coordinates in WGS84
174 self.coords = (minx, miny, maxx, maxy)
177 def minlat(self) -> float:
178 """ Southern-most latitude, corresponding to the minimum y coordinate.
180 return self.coords[1]
183 def maxlat(self) -> float:
184 """ Northern-most latitude, corresponding to the maximum y coordinate.
186 return self.coords[3]
189 def minlon(self) -> float:
190 """ Western-most longitude, corresponding to the minimum x coordinate.
192 return self.coords[0]
195 def maxlon(self) -> float:
196 """ Eastern-most longitude, corresponding to the maximum x coordinate.
198 return self.coords[2]
201 def area(self) -> float:
202 """ Return the area of the box in WGS84.
204 return (self.coords[2] - self.coords[0]) * (self.coords[3] - self.coords[1])
206 def contains(self, pt: Point) -> bool:
207 """ Check if the point is inside or on the boundary of the box.
209 return self.coords[0] <= pt[0] and self.coords[1] <= pt[1]\
210 and self.coords[2] >= pt[0] and self.coords[3] >= pt[1]
212 def to_wkt(self) -> str:
213 """ Return the WKT representation of the Bbox. This
214 is a simple polygon with four points.
216 return 'POLYGON(({0} {1},{0} {3},{2} {3},{2} {1},{0} {1}))'\
217 .format(*self.coords)
220 def from_wkb(wkb: Union[None, str, bytes]) -> 'Optional[Bbox]':
221 """ Create a Bbox from a bounding box polygon as returned by
222 the database. Returns `None` if the input value is None.
227 if isinstance(wkb, str):
231 raise ValueError("WKB must be a bounding box polygon")
232 if wkb.startswith(WKB_BBOX_HEADER_LE):
233 x1, y1, _, _, x2, y2 = unpack('<dddddd', wkb[17:65])
234 elif wkb.startswith(WKB_BBOX_HEADER_BE):
235 x1, y1, _, _, x2, y2 = unpack('>dddddd', wkb[17:65])
237 raise ValueError("WKB has wrong header")
239 return Bbox(min(x1, x2), min(y1, y2), max(x1, x2), max(y1, y2))
242 def from_point(pt: Point, buffer: float) -> 'Bbox':
243 """ Return a Bbox around the point with the buffer added to all sides.
245 return Bbox(pt[0] - buffer, pt[1] - buffer,
246 pt[0] + buffer, pt[1] + buffer)
249 def from_param(inp: Any) -> 'Bbox':
250 """ Return a Bbox from an input parameter. The box may be
251 given as a Bbox, a string or a list or strings or integer.
252 Raises a UsageError if the format is incorrect.
254 if isinstance(inp, Bbox):
258 if isinstance(inp, str):
260 elif isinstance(inp, abc.Sequence):
264 raise UsageError('Bounding box parameter needs 4 coordinates.')
266 x1, y1, x2, y2 = filter(math.isfinite, map(float, seq))
267 except ValueError as exc:
268 raise UsageError('Bounding box parameter needs to be numbers.') from exc
270 x1 = min(180, max(-180, x1))
271 x2 = min(180, max(-180, x2))
272 y1 = min(90, max(-90, y1))
273 y2 = min(90, max(-90, y2))
275 if x1 == x2 or y1 == y2:
276 raise UsageError('Bounding box with invalid parameters.')
278 return Bbox(min(x1, x2), min(y1, y2), max(x1, x2), max(y1, y2))
281 class GeometryFormat(enum.Flag):
282 """ All search functions support returning the full geometry of a place in
283 various formats. The internal geometry is converted by PostGIS to
284 the desired format and then returned as a string. It is possible to
285 request multiple formats at the same time.
288 """ No geometry requested. Alias for a empty flag.
290 GEOJSON = enum.auto()
292 [GeoJSON](https://geojson.org/) format
296 [KML](https://en.wikipedia.org/wiki/Keyhole_Markup_Language) format
300 [SVG](http://www.w3.org/TR/SVG/paths.html) format
304 [WKT](https://en.wikipedia.org/wiki/Well-known_text_representation_of_geometry) format
308 class DataLayer(enum.Flag):
309 """ The `DataLayer` flag type defines the layers that can be selected
310 for reverse and forward search.
312 ADDRESS = enum.auto()
313 """ The address layer contains all places relevant for addresses:
314 fully qualified addresses with a house number (or a house name equivalent,
315 for some addresses) and places that can be part of an address like
316 roads, cities, states.
319 """ Layer for points of interest like shops, restaurants but also
320 recycling bins or postboxes.
322 RAILWAY = enum.auto()
323 """ Layer with railway features including tracks and other infrastructure.
324 Note that in Nominatim's standard configuration, only very few railway
325 features are imported into the database. Thus a custom configuration
326 is required to make full use of this layer.
328 NATURAL = enum.auto()
329 """ Layer with natural features like rivers, lakes and mountains.
331 MANMADE = enum.auto()
332 """ Layer with other human-made features and boundaries. This layer is
333 the catch-all and includes all features not covered by the other
334 layers. A typical example for this layer are national park boundaries.
338 class QueryStatistics(dict[str, Any]):
339 """ A specialised dictionary for collecting query statistics.
342 def __enter__(self) -> 'QueryStatistics':
343 self.log_time('start_function')
346 def __exit__(self, *_: Any) -> None:
347 self.log_time('end_function')
348 self['total_time'] = (self['end_function'] - self['start_function']) \
349 / dt.timedelta(microseconds=1)
350 if 'start_query' in self:
351 self['wait_time'] = (self['start_query'] - self['start_function']) \
352 / dt.timedelta(microseconds=1)
354 self['wait_time'] = 0
355 self['query_time'] = self['total_time'] - self['wait_time']
357 def __missing__(self, key: str) -> str:
360 def log_time(self, key: str) -> None:
361 self[key] = dt.datetime.now(tz=dt.timezone.utc)
365 """ Null object to use, when no query statistics are requested.
368 def __enter__(self) -> 'NoQueryStats':
371 def __exit__(self, *_: Any) -> None:
374 def __setitem__(self, key: str, value: Any) -> None:
377 def log_time(self, key: str) -> None:
381 def format_country(cc: Any) -> List[str]:
382 """ Extract a list of country codes from the input which may be either
383 a string or list of strings. Filters out all values that are not
387 if isinstance(cc, str):
388 clist = cc.split(',')
389 elif isinstance(cc, abc.Sequence):
392 raise UsageError("Parameter 'country' needs to be a comma-separated list "
393 "or a Python list of strings.")
395 return [cc.lower() for cc in clist if isinstance(cc, str) and len(cc) == 2]
398 def format_excluded(ids: Any) -> List[int]:
399 """ Extract a list of place ids from the input which may be either
400 a string or a list of strings or ints. Ignores empty value but
401 throws a UserError on anything that cannot be converted to int.
404 if isinstance(ids, str):
405 plist = [s.strip() for s in ids.split(',')]
406 elif isinstance(ids, abc.Sequence):
409 raise UsageError("Parameter 'excluded' needs to be a comma-separated list "
410 "or a Python list of numbers.")
411 if not all(isinstance(i, int) or
412 (isinstance(i, str) and (not i or i.isdigit())) for i in plist):
413 raise UsageError("Parameter 'excluded' only takes place IDs.")
415 return [int(id) for id in plist if id] or [0]
418 def format_categories(categories: List[Tuple[str, str]]) -> List[Tuple[str, str]]:
419 """ Extract a list of categories. Currently a noop.
424 TParam = TypeVar('TParam', bound='LookupDetails')
427 @dataclasses.dataclass
429 """ Collection of parameters that define which kind of details are
430 returned with a lookup or details result.
432 geometry_output: GeometryFormat = GeometryFormat.NONE
433 """ Add the full geometry of the place to the result. Multiple
434 formats may be selected. Note that geometries can become quite large.
436 address_details: bool = False
437 """ Get detailed information on the places that make up the address
440 linked_places: bool = False
441 """ Get detailed information on the places that link to the result.
443 parented_places: bool = False
444 """ Get detailed information on all places that this place is a parent
445 for, i.e. all places for which it provides the address details.
446 Only POI places can have parents.
448 entrances: bool = False
449 """ Get detailed information about the tagged entrances for the result.
451 keywords: bool = False
452 """ Add information about the search terms used for this place.
454 geometry_simplification: float = 0.0
455 """ Simplification factor for a geometry in degrees WGS. A factor of
456 0.0 means the original geometry is kept. The higher the value, the
457 more the geometry gets simplified.
459 query_stats: Union[QueryStatistics, NoQueryStats] = \
460 dataclasses.field(default_factory=NoQueryStats)
461 """ Optional QueryStatistics object collecting information about
462 runtime behaviour of the call.
466 def from_kwargs(cls: Type[TParam], kwargs: Dict[str, Any]) -> TParam:
467 """ Load the data fields of the class from a dictionary.
468 Unknown entries in the dictionary are ignored, missing ones
469 get the default setting.
471 The function supports type checking and throws a UsageError
472 when the value does not fit.
474 def _check_field(v: Any, field: 'dataclasses.Field[Any]') -> Any:
476 return field.default_factory() \
477 if field.default_factory != dataclasses.MISSING \
479 if field.metadata and 'transform' in field.metadata:
480 return field.metadata['transform'](v)
481 if not isinstance(v, field.type): # type: ignore[arg-type]
482 raise UsageError(f"Parameter '{field.name}' needs to be of {field.type!s}.")
485 return cls(**{f.name: _check_field(kwargs[f.name], f)
486 for f in dataclasses.fields(cls) if f.name in kwargs})
489 @dataclasses.dataclass
490 class ReverseDetails(LookupDetails):
491 """ Collection of parameters for the reverse call.
494 max_rank: int = dataclasses.field(default=30,
495 metadata={'transform': lambda v: max(0, min(v, 30))})
496 """ Highest address rank to return.
499 layers: DataLayer = DataLayer.ADDRESS | DataLayer.POI
500 """ Filter which kind of data to include.
504 @dataclasses.dataclass
505 class SearchDetails(LookupDetails):
506 """ Collection of parameters for the search call.
508 max_results: int = 10
509 """ Maximum number of results to be returned. The actual number of results
513 min_rank: int = dataclasses.field(default=0,
514 metadata={'transform': lambda v: max(0, min(v, 30))})
515 """ Lowest address rank to return.
518 max_rank: int = dataclasses.field(default=30,
519 metadata={'transform': lambda v: max(0, min(v, 30))})
520 """ Highest address rank to return.
523 layers: Optional[DataLayer] = dataclasses.field(default=None,
524 metadata={'transform': lambda r: r})
525 """ Filter which kind of data to include. When 'None' (the default) then
526 filtering by layers is disabled.
529 countries: List[str] = dataclasses.field(default_factory=list,
530 metadata={'transform': format_country})
531 """ Restrict search results to the given countries. An empty list (the
532 default) will disable this filter.
535 excluded: List[int] = dataclasses.field(default_factory=list,
536 metadata={'transform': format_excluded})
537 """ List of OSM objects to exclude from the results. Currently only
538 works when the internal place ID is given.
539 An empty list (the default) will disable this filter.
542 viewbox: Optional[Bbox] = dataclasses.field(default=None,
543 metadata={'transform': Bbox.from_param})
544 """ Focus the search on a given map area.
547 bounded_viewbox: bool = False
548 """ Use 'viewbox' as a filter and restrict results to places within the
552 near: Optional[Point] = dataclasses.field(default=None,
553 metadata={'transform': Point.from_param})
554 """ Order results by distance to the given point.
557 near_radius: Optional[float] = dataclasses.field(default=None,
558 metadata={'transform': lambda r: r})
559 """ Use near point as a filter and drop results outside the given
560 radius. Radius is given in degrees WSG84.
563 categories: List[Tuple[str, str]] = dataclasses.field(default_factory=list,
564 metadata={'transform': format_categories})
565 """ Restrict search to places with one of the given class/type categories.
566 An empty list (the default) will disable this filter.
569 viewbox_x2: Optional[Bbox] = None
571 def __post_init__(self) -> None:
572 if self.viewbox is not None:
573 xext = (self.viewbox.maxlon - self.viewbox.minlon)/2
574 yext = (self.viewbox.maxlat - self.viewbox.minlat)/2
575 self.viewbox_x2 = Bbox(self.viewbox.minlon - xext, self.viewbox.minlat - yext,
576 self.viewbox.maxlon + xext, self.viewbox.maxlat + yext)
578 def restrict_min_max_rank(self, new_min: int, new_max: int) -> None:
579 """ Change the min_rank and max_rank fields to respect the
582 assert new_min <= new_max
583 self.min_rank = max(self.min_rank, new_min)
584 self.max_rank = min(self.max_rank, new_max)
586 def is_impossible(self) -> bool:
587 """ Check if the parameter configuration is contradictionary and
588 cannot yield any results.
590 return (self.min_rank > self.max_rank
591 or (self.bounded_viewbox
592 and self.viewbox is not None and self.near is not None
593 and self.viewbox.contains(self.near))
594 or (self.layers is not None and not self.layers)
595 or (self.max_rank <= 4 and
596 self.layers is not None and not self.layers & DataLayer.ADDRESS))
598 def layer_enabled(self, layer: DataLayer) -> bool:
599 """ Check if the given layer has been chosen. Also returns
600 true when layer restriction has been disabled completely.
602 return self.layers is None or bool(self.layers & layer)
605 @dataclasses.dataclass
606 class EntranceDetails:
607 """ Reference a place by its OSM ID and potentially the basic category.
609 The OSM ID may refer to places in the main table placex and OSM
613 """ The OSM ID of the object.
616 """ The value of the OSM entrance tag (i.e. yes, main, secondary, etc.).
619 """ The location of the entrance node.
621 extratags: Dict[str, str]
622 """ The other tags associated with the entrance node.