From: Sarah Hoffmann <lonvia@denofr.de>
Date: Wed, 28 May 2025 12:13:49 +0000 (+0200)
Subject: release 5.1.0.post7
X-Git-Url: https://git.openstreetmap.org/nominatim.git/commitdiff_plain/HEAD?hp=84bac1bb4df234d0c25d94fb1abbf9289d2d55c1

release 5.1.0.post7
---

diff --git a/.flake8 b/.flake8
index 82d77ed3..1aae19dc 100644
--- a/.flake8
+++ b/.flake8
@@ -6,3 +6,6 @@ extend-ignore =
     E711
 per-file-ignores =
     __init__.py: F401
+    test/python/utils/test_json_writer.py: E131
+    **/conftest.py: E402
+    test/bdd/*: F821
diff --git a/.github/actions/setup-postgresql/action.yml b/.github/actions/setup-postgresql/action.yml
index 331d094a..7a9590c1 100644
--- a/.github/actions/setup-postgresql/action.yml
+++ b/.github/actions/setup-postgresql/action.yml
@@ -11,10 +11,8 @@ runs:
     steps:
         - name: Remove existing PostgreSQL
           run: |
+              sudo /usr/share/postgresql-common/pgdg/apt.postgresql.org.sh -y
               sudo apt-get purge -yq postgresql*
-              sudo apt install curl ca-certificates gnupg
-              curl https://www.postgresql.org/media/keys/ACCC4CF8.asc | gpg --dearmor | sudo tee /etc/apt/trusted.gpg.d/apt.postgresql.org.gpg >/dev/null
-              sudo sh -c 'echo "deb https://apt.postgresql.org/pub/repos/apt $(lsb_release -cs)-pgdg main" > /etc/apt/sources.list.d/pgdg.list'
               sudo apt-get update -qq
 
           shell: bash
diff --git a/.github/workflows/ci-tests.yml b/.github/workflows/ci-tests.yml
index 8b38d3dc..4d555416 100644
--- a/.github/workflows/ci-tests.yml
+++ b/.github/workflows/ci-tests.yml
@@ -37,10 +37,10 @@ jobs:
         needs: create-archive
         strategy:
             matrix:
-                flavour: ["ubuntu-20", "ubuntu-24"]
+                flavour: ["ubuntu-22", "ubuntu-24"]
                 include:
-                    - flavour: ubuntu-20
-                      ubuntu: 20
+                    - flavour: ubuntu-22
+                      ubuntu: 22
                       postgresql: 12
                       lua: '5.1'
                       dependencies: pip
@@ -68,26 +68,34 @@ jobs:
               with:
                   dependencies: ${{ matrix.dependencies }}
 
+            - uses: actions/cache@v4
+              with:
+                  path: |
+                     /usr/local/bin/osm2pgsql
+                  key: osm2pgsql-bin-22-1
+              if: matrix.ubuntu == '22'
+
             - name: Compile osm2pgsql
               run: |
-                  sudo apt-get install -y -qq libboost-system-dev libboost-filesystem-dev libexpat1-dev zlib1g-dev libbz2-dev libpq-dev libproj-dev libicu-dev liblua${LUA_VERSION}-dev lua-dkjson nlohmann-json3-dev 
-                  mkdir osm2pgsql-build
-                  cd osm2pgsql-build
-                  git clone https://github.com/osm2pgsql-dev/osm2pgsql
-                  mkdir build
-                  cd build
-                  cmake ../osm2pgsql
-                  make
-                  sudo make install
-                  cd ../..
-                  rm -rf osm2pgsql-build
-              if: matrix.ubuntu == '20'
+                  if [ ! -f /usr/local/bin/osm2pgsql ]; then
+                      sudo apt-get install -y -qq libboost-system-dev libboost-filesystem-dev libexpat1-dev zlib1g-dev libbz2-dev libpq-dev libproj-dev libicu-dev liblua${LUA_VERSION}-dev lua-dkjson nlohmann-json3-dev 
+                      mkdir osm2pgsql-build
+                      cd osm2pgsql-build
+                      git clone https://github.com/osm2pgsql-dev/osm2pgsql
+                      mkdir build
+                      cd build
+                      cmake ../osm2pgsql
+                      make
+                      sudo make install
+                      cd ../..
+                      rm -rf osm2pgsql-build
+                  else
+                      sudo apt-get install -y -qq libexpat1 liblua${LUA_VERSION}
+                  fi
+              if: matrix.ubuntu == '22'
               env:
                   LUA_VERSION: ${{ matrix.lua }}
 
-            - name: Install test prerequisites
-              run: ./venv/bin/pip install behave==1.2.6
-
             - name: Install test prerequisites (apt)
               run: sudo apt-get install -y -qq python3-pytest python3-pytest-asyncio uvicorn python3-falcon python3-aiosqlite python3-pyosmium
               if: matrix.dependencies == 'apt'
@@ -96,11 +104,14 @@ jobs:
               run: ./venv/bin/pip install pytest-asyncio falcon starlette asgi_lifespan aiosqlite osmium uvicorn
               if: matrix.dependencies == 'pip'
 
+            - name: Install test prerequisites
+              run: ./venv/bin/pip install pytest-bdd
+
             - name: Install latest flake8
               run: ./venv/bin/pip install -U flake8
 
             - name: Python linting
-              run: ../venv/bin/python -m flake8 src
+              run: ../venv/bin/python -m flake8 src test/python test/bdd
               working-directory: Nominatim
 
             - name: Install mypy and typechecking info
@@ -118,8 +129,8 @@ jobs:
 
             - name: BDD tests
               run: |
-                  ../../../venv/bin/python -m behave -DREMOVE_TEMPLATE=1 --format=progress3
-              working-directory: Nominatim/test/bdd
+                  ../venv/bin/python -m pytest test/bdd --nominatim-purge
+              working-directory: Nominatim
 
     install:
         runs-on: ubuntu-latest
@@ -185,9 +196,6 @@ jobs:
             - name: Prepare import environment
               run: |
                   mv Nominatim/test/testdb/apidb-test-data.pbf test.pbf
-                  mv Nominatim/settings/flex-base.lua flex-base.lua
-                  mv Nominatim/settings/import-extratags.lua import-extratags.lua
-                  mv Nominatim/settings/taginfo.lua taginfo.lua
                   rm -rf Nominatim
                   mkdir data-env-reverse
               working-directory: /home/nominatim
@@ -205,7 +213,7 @@ jobs:
               working-directory: /home/nominatim/nominatim-project
 
             - name: Print taginfo
-              run: lua taginfo.lua
+              run: lua ./nominatim-venv/lib/*/site-packages/nominatim_db/resources/lib-lua/taginfo.lua
               working-directory: /home/nominatim
 
             - name: Collect host OS information
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index b9bf2920..6c90cd3c 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -87,7 +87,6 @@ Checklist for releases:
 * [ ] increase versions in
   * `src/nominatim_api/version.py`
   * `src/nominatim_db/version.py`
-  * CMakeLists.txt
 * [ ] update `ChangeLog` (copy information from patch releases from release branch)
 * [ ] complete `docs/admin/Migration.md`
 * [ ] update EOL dates in `SECURITY.md`
@@ -114,3 +113,5 @@ Checklist for releases:
   * run `nominatim --version` to confirm correct version
 * [ ] tag new release and add a release on github.com
 * [ ] build pip packages and upload to pypi
+  * `make build`
+  * `twine upload dist/*`
diff --git a/ChangeLog b/ChangeLog
index b7609255..dff198eb 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,3 +1,47 @@
+5.1.0
+ * replace datrie with simple internal trie implementation
+ * add pattern-based postcode parser for queries,
+   postcodes no longer need to be present in OSM to be found
+ * take variants into account when computing token similarity
+ * add extratags output to geocodejson format
+ * fix default layer setting used for structured queries
+ * update abbreviation lists for Russian and English
+   (thanks @shoorick, @IvanShift, @mhsrn21)
+ * fix variant generation for Norwegian
+ * fix normalization around space-like characters
+ * improve postcode search and handling of postcodes in queries
+ * reorganise internal query structure and get rid of slow enums
+ * enable code linting for tests
+ * various code modernisations in test code (thanks @eumiro)
+ * remove setting osm2pgsql location via config.lib_dir
+ * make SQL functions parallel safe as far as possible (thanks @otbutz)
+ * various fixes and improvements to documentation (thanks @TuringVerified)
+
+5.0.0
+ * increase required versions for PostgreSQL (12+), PostGIS (3.0+)
+ * remove installation via cmake and debundle osm2pgsql
+ * remove deprecated PHP frontend
+ * remove deprecated legacy tokenizer
+ * add configurable pre-processing of queries
+ * add query pre-processor to split up Japanese addresses
+ * rewrite of osm2pgsql style implementation
+   (also adds support for osm2pgsql-themepark)
+ * reduce the number of SQL queries needed to complete a 'lookup' call
+ * improve computation of centroid for lines with only two points
+ * improve bbox output for postcode areas
+ * improve result order by returning the largest object when other things are
+   equal
+ * add fallback for reverse geocoding to default country tables
+ * exclude postcode areas from reverse geocoding
+ * disable search endpoint when database is reverse-only (regression)
+ * minor performance improvements to area split algorithm
+ * switch table and index creation to use autocommit mode to avoid deadlocks
+ * drop overly long ways during import
+ * restrict automatic migrations to versions 4.3+
+ * switch linting from pylint to flake8
+ * switch tests to use a wikimedia test file in the new CSV style
+ * various fixes and improvements to documentation
+
 4.5.0
  * allow building Nominatim as a pip package
  * make osm2pgsql building optional
diff --git a/Makefile b/Makefile
index 9e914850..d6423add 100644
--- a/Makefile
+++ b/Makefile
@@ -24,10 +24,10 @@ pytest:
 	pytest test/python
 
 lint:
-	flake8 src
+	flake8 src test/python test/bdd
 
 bdd:
-	cd test/bdd; behave -DREMOVE_TEMPLATE=1
+	pytest test/bdd --nominatim-purge
 
 # Documentation
 
diff --git a/README.md b/README.md
index 3b0f328a..54bdbf8e 100644
--- a/README.md
+++ b/README.md
@@ -27,18 +27,25 @@ can be found at nominatim.org as well.
 
 A quick summary of the necessary steps:
 
-1. Create a Python virtualenv and install the packages:
+
+1. Clone this git repository and download the country grid
+
+        git clone https://github.com/osm-search/Nominatim.git
+        wget -O Nominatim/data/country_osm_grid.sql.gz https://nominatim.org/data/country_grid.sql.gz
+
+2. Create a Python virtualenv and install the packages:
 
         python3 -m venv nominatim-venv
         ./nominatim-venv/bin/pip install packaging/nominatim-{api,db}
 
-2. Create a project directory, get OSM data and import:
+3. Create a project directory, get OSM data and import:
 
         mkdir nominatim-project
         cd nominatim-project
-        ../nominatim-venv/bin/nominatim import --osm-file <your planet file>
+        ../nominatim-venv/bin/nominatim import --osm-file <your planet file> 2>&1 | tee setup.log
+
 
-3. Start the webserver:
+4. Start the webserver:
 
         ./nominatim-venv/bin/pip install uvicorn falcon
         ../nominatim-venv/bin/nominatim serve
diff --git a/SECURITY.md b/SECURITY.md
index 3ec22cbd..98295e1f 100644
--- a/SECURITY.md
+++ b/SECURITY.md
@@ -9,10 +9,11 @@ versions.
 
 | Version | End of support for security updates |
 | ------- | ----------------------------------- |
+| 5.1.x   | 2027-04-01                          |
+| 5.0.x   | 2027-02-06                          |
 | 4.5.x   | 2026-09-12                          |
 | 4.4.x   | 2026-03-07                          |
 | 4.3.x   | 2025-09-07                          |
-| 4.2.x   | 2024-11-24                          |
 
 ## Reporting a Vulnerability
 
diff --git a/docs/admin/Deployment-Python.md b/docs/admin/Deployment-Python.md
index 5932f4e6..463e15c0 100644
--- a/docs/admin/Deployment-Python.md
+++ b/docs/admin/Deployment-Python.md
@@ -37,7 +37,7 @@ cd Nominatim
 ```
 
 The recommended way to deploy a Python ASGI application is to run
-the ASGI runner [uvicorn](https://uvicorn.org/)
+the ASGI runner [uvicorn](https://www.uvicorn.org/)
 together with [gunicorn](https://gunicorn.org/) HTTP server. We use
 Falcon here as the web framework.
 
diff --git a/docs/admin/Installation.md b/docs/admin/Installation.md
index dadbe460..2571de5d 100644
--- a/docs/admin/Installation.md
+++ b/docs/admin/Installation.md
@@ -26,7 +26,7 @@ For running Nominatim:
 
   * [PostgreSQL](https://www.postgresql.org) (12+ will work, 13+ strongly recommended)
   * [PostGIS](https://postgis.net) (3.0+ will work, 3.2+ strongly recommended)
-  * [osm2pgsql](https://osm2pgsql.org) (1.8+, optional when building with CMake)
+  * [osm2pgsql](https://osm2pgsql.org) (1.8+)
   * [Python 3](https://www.python.org/) (3.7+)
 
 Furthermore the following Python libraries are required:
@@ -37,7 +37,6 @@ Furthermore the following Python libraries are required:
   * [Jinja2](https://palletsprojects.com/p/jinja/)
   * [PyICU](https://pypi.org/project/PyICU/)
   * [PyYaml](https://pyyaml.org/) (5.1+)
-  * [datrie](https://github.com/pytries/datrie)
 
 These will be installed automatically when using pip installation.
 
@@ -102,6 +101,15 @@ you might consider setting:
 and even reduce `autovacuum_work_mem` further. This will reduce the amount
 of memory that autovacuum takes away from the import process.
 
+## Installing the latest release
+
+Nominatim is most easily installed directly from PyPI. Make sure you have installed
+osm2pgsql, PostgreSQL/PostGIS and libICU together with its header files.
+
+Then you can install Nominatim with:
+
+    pip install nominatim-db nominatim-api
+
 ## Downloading and building Nominatim
 
 ### Downloading the latest release
diff --git a/docs/admin/Migration.md b/docs/admin/Migration.md
index 13e6d7f5..becf2f7b 100644
--- a/docs/admin/Migration.md
+++ b/docs/admin/Migration.md
@@ -9,19 +9,15 @@ the following steps:
 * Update the frontend: `pip install -U nominatim-api`
 * (optionally) Restart updates
 
-If you are still using CMake for the installation of Nominatim, then you
-need to update the software in one step before migrating the database.
-It is not recommended to do this while the machine is serving requests.
-
 Below you find additional migrations and hints about other structural and
 breaking changes. **Please read them before running the migration.**
 
 !!! note
     If you are migrating from a version <4.3, you need to install 4.3
-    first and migrate to 4.3 first. Then you can migrate to the current
+    and migrate to 4.3 first. Then you can migrate to the current
     version. It is strongly recommended to do a reimport instead.
 
-## 4.5.0 -> master
+## 4.5.0 -> 5.0.0
 
 ### PHP frontend removed
 
@@ -33,6 +29,42 @@ needed. It currently omits a warning and does otherwise nothing. It will be
 removed in later versions of Nominatim. So make sure you remove it from your
 scripts.
 
+### CMake building removed
+
+Nominatim can now only be installed via pip. Please follow the installation
+instructions for the current version to change to pip.
+
+### osm2pgsql no longer vendored in
+
+Nominatim no longer ships its own version of osm2pgsql. Please install a
+stock version of osm2pgsql from your distribution. See the
+[installation instructions for osm2pgsql](https://osm2pgsql.org/doc/install.html)
+for details. A minimum version of 1.8 is required. The current stable versions
+of Ubuntu and Debian already ship with an appropriate version. For older
+installations, you may have to compile a newer osm2pgsql yourself.
+
+### Legacy tokenizer removed
+
+The `legacy` tokenizer is no longer enabled. This tokenizer has been superseded
+by the `ICU` tokenizer a long time ago. In the unlikely case that your database
+still uses the `legacy` tokenizer, you must reimport your database.
+
+### osm2pgsql style overhauled
+
+There are some fundamental changes to how customized osm2pgsql styles should
+be written. The changes are mostly backwards compatible, i.e. custom styles
+should still work with the new implementation. The only exception is a
+customization of the `process_tags()` function. This function is no longer
+considered public and neither are the helper functions used in it.
+They currently still work but will be removed at some point. If you have
+been making changes to `process_tags`, please review your style and try
+to switch to the new convenience functions.
+
+For more information on the changes, see the
+[pull request](https://github.com/osm-search/Nominatim/pull/3615)
+and read the new
+[customization documentation](https://nominatim.org/release-docs/latest/customize/Import-Styles/).
+
 ## 4.4.0 -> 4.5.0
 
 ### New structure for Python packages
diff --git a/docs/admin/Update.md b/docs/admin/Update.md
index 5d1324d0..cdb79cae 100644
--- a/docs/admin/Update.md
+++ b/docs/admin/Update.md
@@ -68,10 +68,10 @@ the update interval no new data has been published yet, it will go to sleep
 until the next expected update and only then attempt to download the next batch.
 
 The one-time mode is particularly useful if you want to run updates continuously
-but need to schedule other work in between updates. For example, the main
-service at osm.org uses it, to regularly recompute postcodes -- a process that
-must not be run while updates are in progress. Its update script
-looks like this:
+but need to schedule other work in between updates. For example, you might
+want to regularly recompute postcodes -- a process that
+must not be run while updates are in progress. An update script refreshing
+postcodes regularly might look like this:
 
 ```sh
 #!/bin/bash
@@ -109,17 +109,19 @@ Unit=nominatim-updates.service
 WantedBy=multi-user.target
 ```
 
-And then a similar service definition: `/etc/systemd/system/nominatim-updates.service`:
+`OnUnitActiveSec` defines how often the individual update command is run.
+
+Then add a service definition for the timer in `/etc/systemd/system/nominatim-updates.service`:
 
 ```
 [Unit]
 Description=Single updates of Nominatim
 
 [Service]
-WorkingDirectory=/srv/nominatim
-ExecStart=nominatim replication --once
-StandardOutput=append:/var/log/nominatim-updates.log
-StandardError=append:/var/log/nominatim-updates.error.log
+WorkingDirectory=/srv/nominatim-project
+ExecStart=/srv/nominatim-venv/bin/nominatim replication --once
+StandardOutput=journal
+StandardError=inherit
 User=nominatim
 Group=nominatim
 Type=simple
@@ -128,9 +130,9 @@ Type=simple
 WantedBy=multi-user.target
 ```
 
-Replace the `WorkingDirectory` with your project directory. Also adapt user and
-group names as required. `OnUnitActiveSec` defines how often the individual
-update command is run.
+Replace the `WorkingDirectory` with your project directory. `ExecStart` points
+to the nominatim binary that was installed in your virtualenv earlier.
+Finally, you might need to adapt user and group names as required.
 
 Now activate the service and start the updates:
 
@@ -140,12 +142,13 @@ sudo systemctl enable nominatim-updates.timer
 sudo systemctl start nominatim-updates.timer
 ```
 
-You can stop future data updates, while allowing any current, in-progress
+You can stop future data updates while allowing any current, in-progress
 update steps to finish, by running `sudo systemctl stop
 nominatim-updates.timer` and waiting until `nominatim-updates.service` isn't
-running (`sudo systemctl is-active nominatim-updates.service`). Current output
-from the update can be seen like above (`systemctl status
-nominatim-updates.service`).
+running (`sudo systemctl is-active nominatim-updates.service`).
+
+To check the output from the update process, use journalctl: `journalctl -u
+nominatim-updates.service`
 
 
 #### Catch-up mode
@@ -155,13 +158,13 @@ all changes from the server until the database is up-to-date. The catch-up mode
 still respects the parameter `NOMINATIM_REPLICATION_MAX_DIFF`. It downloads and
 applies the changes in appropriate batches until all is done.
 
-The catch-up mode is foremost useful to bring the database up to speed after the
+The catch-up mode is foremost useful to bring the database up to date after the
 initial import. Give that the service usually is not in production at this
 point, you can temporarily be a bit more generous with the batch size and
 number of threads you use for the updates by running catch-up like this:
 
 ```
-cd /srv/nominatim
+cd /srv/nominatim-project
 NOMINATIM_REPLICATION_MAX_DIFF=5000 nominatim replication --catch-up --threads 15
 ```
 
@@ -173,13 +176,13 @@ replication catch-up at whatever interval you desire.
     When running scheduled updates with catch-up, it is a good idea to choose
     a replication source with an update frequency that is an order of magnitude
     lower. For example, if you want to update once a day, use an hourly updated
-    source. This makes sure that you don't miss an entire day of updates when
+    source. This ensures that you don't miss an entire day of updates when
     the source is unexpectedly late to publish its update.
 
     If you want to use the source with the same update frequency (e.g. a daily
     updated source with daily updates), use the
-    continuous update mode. It ensures to re-request the newest update until it
-    is published.
+    once mode together with a frequently run systemd script as described above.
+    It keeps re-requesting the newest update until it has been published.
 
 
 #### Continuous updates
@@ -197,36 +200,3 @@ parameters:
 
 The update application keeps running forever and retrieves and applies
 new updates from the server as they are published.
-
-You can run this command as a simple systemd service. Create a service
-description like that in `/etc/systemd/system/nominatim-updates.service`:
-
-```
-[Unit]
-Description=Continuous updates of Nominatim
-
-[Service]
-WorkingDirectory=/srv/nominatim
-ExecStart=nominatim replication
-StandardOutput=append:/var/log/nominatim-updates.log
-StandardError=append:/var/log/nominatim-updates.error.log
-User=nominatim
-Group=nominatim
-Type=simple
-
-[Install]
-WantedBy=multi-user.target
-```
-
-Replace the `WorkingDirectory` with your project directory. Also adapt user
-and group names as required.
-
-Now activate the service and start the updates:
-
-```
-sudo systemctl daemon-reload
-sudo systemctl enable nominatim-updates
-sudo systemctl start nominatim-updates
-```
-
-
diff --git a/docs/api/Output.md b/docs/api/Output.md
index 75220cf5..a5ec933e 100644
--- a/docs/api/Output.md
+++ b/docs/api/Output.md
@@ -106,8 +106,11 @@ The following feature attributes are implemented:
  * `name` - localised name of the place
  * `housenumber`, `street`, `locality`, `district`, `postcode`, `city`,
    `county`, `state`, `country` -
-   provided when it can be determined from the address
+   provided when it can be determined from the address (only with `addressdetails=1`)
  * `admin` - list of localised names of administrative boundaries (only with `addressdetails=1`)
+ * `extra` - dictionary with additional useful tags like `website` or `maxspeed`
+   (only with `extratags=1`)
+
 
 Use `polygon_geojson` to output the full geometry of the object instead
 of the centroid.
diff --git a/docs/api/Search.md b/docs/api/Search.md
index 1c269168..3c9a7148 100644
--- a/docs/api/Search.md
+++ b/docs/api/Search.md
@@ -212,7 +212,7 @@ other layers.
 The featureType allows to have a more fine-grained selection for places
 from the address layer. Results can be restricted to places that make up
 the 'state', 'country' or 'city' part of an address. A featureType of
-settlement selects any human inhabited feature from 'state' down to
+`settlement` selects any human inhabited feature from 'state' down to
 'neighbourhood'.
 
 When featureType is set, then results are automatically restricted
diff --git a/docs/customize/Import-Styles.md b/docs/customize/Import-Styles.md
index 003e56e3..23778f77 100644
--- a/docs/customize/Import-Styles.md
+++ b/docs/customize/Import-Styles.md
@@ -1,95 +1,123 @@
-## Configuring the Import
+# Configuring the Import of OSM data
 
 In the very first step of a Nominatim import, OSM data is loaded into the
 database. Nominatim uses [osm2pgsql](https://osm2pgsql.org) for this task.
 It comes with a [flex style](https://osm2pgsql.org/doc/manual.html#the-flex-output)
 specifically tailored to filter and convert OSM data into Nominatim's
-internal data representation.
-
-There are a number of default configurations for the flex style which
-result in geocoding databases of different detail. The
+internal data representation. Nominatim ships with a few preset
+configurations for this import, each resulting in a geocoding database with a
+different level of detail. The
 [Import section](../admin/Import.md#filtering-imported-data) explains
 these default configurations in detail.
 
-You can also create your own custom style. Put the style file into your
-project directory and then set `NOMINATIM_IMPORT_STYLE` to the name of the file.
-It is always recommended to start with one of the standard styles and customize
-those. You find the standard styles under the name `import-<stylename>.lua`
-in the standard Nominatim configuration path (usually `/etc/nominatim` or
-`/usr/local/etc/nominatim`).
+If you want to have more control over which OSM data is added to the database,
+you can also create your own custom style. Create a new lua style file, put it
+into your project directory and then set `NOMINATIM_IMPORT_STYLE` to the name
+of the file. Custom style files can be used to modify the existing preset
+configurations or to implement your own configuration from scratch.
 
 The remainder of the page describes how the flex style works and how to
 customize it.
 
-### The `flex-base.lua` module
+## The `flex-base` lua module
 
 The core of Nominatim's flex import configuration is the `flex-base` module.
 It defines the table layout used by Nominatim and provides standard
-implementations for the import callbacks that make it easy to customize
+implementations for the import callbacks that help with customizing
 how OSM tags are used by Nominatim.
 
-Every custom style should include this module to make sure that the correct
+Every custom style must include this module to make sure that the correct
 tables are created. Thus start your custom style as follows:
 
 ``` lua
 local flex = require('flex-base')
+```
+
+### Using preset configurations
+
+If you want to start with one of the existing presets, then you can import
+its settings using the `import_topic()` function:
+
+``` lua
+local flex = require('flex-base')
 
+flex.import_topic('streets')
 ```
 
-The following sections explain how the module can be customized.
+The `import_topic` function takes an optional second configuration
+parameter. The available options are explained in the
+[themepark section](#using-osm2pgsql-themepark).
 
+!!! note
+    You can also directly import the preset style files, e.g.
+    `local flex = require('import-street')`. It is not possible to
+    set extra configuration this way.
 
-### Changing the recognized tags
+### How processing works
 
-If you just want to change which OSM tags are recognized during import,
-then there are a number of convenience functions to set the tag lists used
-during the processing.
+When Nominatim processes an OSM object, it looks for four kinds of tags:
+The _main tags_ classify what kind of place the OSM object represents. One
+OSM object can have more than one main tag. In such a case, one database entry
+is created for each main tag. _Name tags_ represent searchable names of the
+place. _Address tags_ are used to compute the address hierarchy of the place.
+Address tags are used for searching and for creating a display name of the place.
+_Extra tags_ are any tags that are not directly related to search but
+contain interesting additional information.
 
-!!! warning
-    There are no built-in defaults for the tag lists, so all the functions
-    need to be called from your style script to fully process the data.
-    Make sure you start from one of the default style and only modify
-    the data you are interested in. You can also derive your style from an
-    existing style by importing the appropriate module, e.g.
-    `local flex = require('import-street')`.
+!!! danger
+    Some tags in the extratags category are used by Nominatim to better
+    classify the place. You want to make sure these are always present
+    in custom styles.
 
-Many of the following functions take _key match lists_. These lists can
+Configuring the style means deciding which key and/or key/value is used
+in which category.
+
+## Changing the recognized tags
+
+The flex style offers a number of functions to set the classification of
+each OSM tag. Most of these functions can also take a preset string instead
+of a tag description. These presets describe common configurations that
+are also used in the definition of the predefined styles. This section
+lists the configuration functions and the accepted presets.
+
+#### Key match lists
+
+Some of the following functions take _key match lists_. These lists can
 contain three kinds of strings to match against tag keys:
 A string that ends in an asterisk `*` is a prefix match and accordingly matches
 against any key that starts with the given string (minus the `*`). 
 A suffix match can be defined similarly with a string that starts with a `*`.
 Any other string is matched exactly against tag keys.
 
+### Main tags
+
+`set_main_tags()` and `modify_main_tags()` define which tags are used as main
+tags. Each takes a lua table parameter which defines how keys and key/value
+combinations are classified.
+
+The following classifications are recognized:
 
-#### `set_main_tags()` - principal tags
-
-If a principal or main tag is found on an OSM object, then the object
-is included in Nominatim's search index. A single object may also have
-multiple main tags. In that case, the object will be included multiple
-times in the index, once for each main tag.
-
-The flex script distinguishes between four types of main tags:
-
-* __always__: a main tag that is used unconditionally
-* __named__: consider this main tag only, if the object has a proper name
-  (a reference is not enough, see below).
-* __named_with_key__: consider this main tag only, when the object has
-  a proper name with a domain prefix. For example, if the main tag is
-  `bridge=yes`, then it will only be added as an extra row, if there is
-  a tag `bridge:name[:XXX]` for the same object. If this property is set,
-  all other names that are not domain-specific are ignored.
-* __fallback__: use this main tag only, if there is no other main tag.
-  Fallback always implied `named`, i.e. fallbacks are only tried for
-  named objects.
-
-The `set_main_tags()` function takes exactly one table parameter which
-defines the keys and key/value combinations to include and the kind of
-main tag. Each lua table key defines an OSM tag key. The value may
-be a string defining the kind of main key as described above. Then the tag will
-be considered a main tag for any possible value. To further restrict
-which values are acceptable, give a table with the permitted values
-and their kind of main tag. If the table contains a simple value without
-key, then this is used as default for values that are not listed.
+| classification  | meaning |
+| :-------------- | :------ |
+| always          | Unconditionally use this tag as a main tag. |
+| named           | Consider as main tag, when the object has a primary name (see [names](#name-tags) below) |
+| named_with_key  | Consider as main tag, when the object has a primary name with a domain prefix. For example, if the main tag is  `bridge=yes`, then it will only be added as an extra entry, if there is a tag `bridge:name[:XXX]` for the same object. If this property is set, all names that are not domain-specific are ignored. |
+| fallback        | Consider as main tag only when no other main tag was found. Fallback always implies `named`, i.e. fallbacks are only tried for objects with primary names. |
+| delete          | Completely ignore the tag in any further processing |
+| extra           | Move the tag to extratags and then ignore it for further processing |
+| `<function>`| Advanced handling, see [below](#advanced-main-tag-handling) |
+
+Each key in the table parameter defines an OSM tag key. The value may
+be directly a classification as described above. Then the tag will
+be considered a main tag for any possible value that is not further defined.
+To further restrict which values are acceptable, give a table with the
+permitted values and their kind of main tag. If the table contains a simple
+value without key, then this is used as default for values that are not listed.
+
+`set_main_tags()` will completely replace the current main tag configuration
+with the new configuration. `modify_main_tags()` will merge the new
+configuration with the existing one. Otherwise, the two functions do exactly
+the same thing.
 
 !!! example
     ``` lua
@@ -97,80 +125,188 @@ key, then this is used as default for values that are not listed.
 
     flex.set_main_tags{
         boundary = {administrative = 'named'},
-        highway = {'always', street_lamp = 'named'},
+        highway = {'always', street_lamp = 'named', no = 'delete'},
         landuse = 'fallback'
     }
     ```
 
     In this example an object with a `boundary` tag will only be included
     when it has a value of `administrative`. Objects with `highway` tags are
-    always included. However when the value is `street_lamp` then the object
-    must have a name, too. With any other value, the object is included
-    independently of the name. Finally, if a `landuse` tag is present then
-    it will be used independely of the concrete value if neither boundary
+    always included with two exceptions: the troll tag `highway=no` is
+    deleted on the spot. And when the value is `street_lamp` then the object
+    must have a name, too. Finally, if a `landuse` tag is present then
+    it will be used independently of the concrete value when neither boundary
     nor highway tags were found and the object is named.
 
+##### Presets
 
-#### `set_prefilters()` - ignoring tags
+| Name   | Description |
+| :----- | :---------- |
+| admin  | Basic tag set collecting places and administrative boundaries. This set is needed also to ensure proper address computation and should therefore always be present. You can disable selected place types like `place=locality` after adding this set, if they are not relevant for your use case. |
+| all_boundaries | Extends the set of recognized boundaries and places to all available ones. |
+| natural | Tags for natural features like rivers and mountain peaks. |
+| street/default | Tags for streets. Major streets are always included, minor ones only when they have a name. |
+| street/car | Tags for all streets that can be used by a motor vehicle. |
+| street/all | Includes all highway features named and unnamed. |
+| poi/delete | Adds most POI features with and without name. Some frequent but very domain-specific values are excluded by deleting them. |
+| poi/extra | Like 'poi/delete' but excluded values are moved to extratags. |
 
-Pre-filtering of tags allows to ignore them for any further processing.
-Thus pre-filtering takes precedence over any other tag processing. This is
-useful when some specific key/value combinations need to be excluded from
-processing. When tags are filtered, they may either be deleted completely
-or moved to `extratags`. Extra tags are saved with the object and returned
-to the user when requested, but are not used otherwise.
 
-`set_prefilters()` takes a table with four optional fields:
+##### Advanced main tag handling
 
-* __delete_keys__ is a _key match list_ for tags that should be deleted
-* __delete_tags__ contains a table of tag keys pointing to a list of tag
-  values. Tags with matching key/value pairs are deleted.
-* __extra_keys__ is a _key match list_ for tags which should be saved into
-  extratags
-* __extra_tags__ contains a table of tag keys pointing to a list of tag
-  values. Tags with matching key/value pairs are moved to extratags.
+The groups described above are in fact only a preset for a filtering function
+that is used to make the final decision how a pre-selected main tag is entered
+into Nominatim's internal table. To further customize handling you may also
+supply your own filtering function.
 
-Key list may contain three kinds of strings:
-A string that ends in an asterisk `*` is a prefix match and accordingly matches
-against any key that starts with the given string (minus the `*`). 
-A suffix match can be defined similarly with a string that starts with a `*`.
-Any other string is matched exactly against tag keys.
+The function takes up to three parameters: a Place object of the object
+being processed, the key of the main tag and the value of the main tag.
+The function may return one of three values:
+
+* `nil` or `false` causes the entry to be ignored
+* the Place object causes the place to be added as is
+* `Place.copy(names=..., address=..., extratags=...)` causes the
+  place to be entered into the database but with name/address/extratags
+  set to the given different values.
+
+The Place object has some read-only values that can be used to determine
+the handling:
+
+* **object** is the original OSM object data handed in by osm2pgsql
+* **admin_level** is the content of the admin_level tag, parsed into an integer and normalized to a value between 0 and 15
+* **has_name** is a boolean indicating if the object has a primary name tag
+* **names** is a table with the collected list of name tags
+* **address** is a table with the collected list of address tags
+* **extratags** is a table with the collected list of additional tags to save
 
 !!! example
     ``` lua
-    local flex = require('import-full')
+    local flex = require('flex-base')
 
-    flex.set_prefilters{
-        delete_keys = {'source', 'source:*'},
-        extra_tags = {amenity = {'yes', 'no'}}
-    }
-    flex.set_main_tags{
-        amenity = 'always'
-    }
+    flex.add_topic('street')
+
+    local function no_sidewalks(place, k, v)
+        if place.object.tags.footway == 'sidewalk' then
+            return false
+        end
+
+        -- default behaviour is to have all footways
+        return place
+    end
+
+    flex.modify_main_tags{highway = {footway = no_sidewalks}}
+    ```
+    This script adds a custom handler for `highway=footway`. It only includes
+    them in the database, when the object doesn't have a tag `footway=sidewalk`
+    indicating that it is just part of a larger street which should already
+    be indexed. Note that it is not necessary to check the key and value
+    of the main tag because the function is only used for the specific
+    main tag.
+
+
+### Ignored tags
+
+The function `ignore_keys()` sets the `delete` classification for keys.
+This function takes a _key match list_ so that it is possible to exclude
+groups of keys.
+
+Note that full matches always take precedence over suffix matches, which
+in turn take precedence over prefix matches.
+
+!!! example
+    ``` lua
+    local flex = require('flex-base')
+
+    flex.add_topic('admin')
+    flex.ignore_keys{'old_name', 'old_name:*'}
     ```
 
-    In this example any tags `source` and tags that begin with `source:`  are
-    deleted before any other processing is done. Getting rid of frequent tags
-    this way can speed up the import.
+    This example uses the `admin` preset with the exception that names
+    that are no longer in current use are ignored.
+
+##### Presets
 
-    Tags with `amenity=yes` or `amenity=no` are moved to extratags. Later
-    all tags with an `amenity` key are made a main tag. This effectively means
-    that Nominatim will use all amenity tags except for those with value
-    yes and no.
+| Name     | Description |
+| :-----   | :---------- |
+| metatags | Tags with meta information about the OSM tag like source, notes and import sources. |
+| name     | Non-names that actually describe properties or name parts. These names can throw off search and should always be removed. |
+| address  | Extra `addr:*` tags that are not useful for Nominatim. |
 
-#### `set_name_tags()` - defining names
 
-The flex script distinguishes between two kinds of names:
+### Tags for `extratags`
 
-* __main__: the primary names make an object fully searchable.
-  Main tags of type _named_ will only cause the object to be included when
-  such a primary name is present. Primary names are usually those found
-  in the `name` tag and its variants.
-* __extra__: extra names are still added to the search index but they are
-  alone not sufficient to make an object named.
+The function `add_for_extratags()` sets the `extra` classification for keys.
+This function takes a
+_key match list_ so that it is possible to move groups of keys to extratags.
 
-`set_name_tags()` takes a table with two optional fields `main` and `extra`.
-They take _key match lists_ for main and extra names respectively.
+Note that full matches always take precedence over suffix matches, which
+in turn take precedence over prefix matches.
+
+!!! example
+    ``` lua
+    local flex = require('flex-base')
+
+    flex.add_topic('street')
+    flex.add_for_extratags{'surface', 'access', 'vehicle', 'maxspeed'}
+    ```
+
+    This example uses the `street` preset but adds a couple of tags that
+    are of interest about the condition of the street.
+
+##### Presets
+
+| Name     | Description |
+| :-----   | :---------- |
+| required | Tags that Nominatim will use for various computations when present in extratags. Always include these. |
+
+In addition, all [presets from ignored tags](#presets_1) are accepted.
+
+### General pre-filtering
+
+_(deprecated)_ `set_prefilters()` allows setting the `delete` and `extra`
+classification for main tags.
+
+This function removes all previously set main tags with `delete` and `extra`
+classification and then adds the newly defined tags.
+
+`set_prefilters()` takes a table with four optional fields:
+
+* __delete_keys__ is a _key match list_ for tags that should be deleted
+* __delete_tags__ contains a table of tag keys pointing to a list of tag
+  values. Tags with matching key/value pairs are deleted.
+* __extra_keys__ is a _key match list_ for tags which should be saved into
+  extratags
+* __extra_tags__ contains a table of tag keys pointing to a list of tag
+  values. Tags with matching key/value pairs are moved to extratags.
+
+!!! danger "Deprecation warning"
+    Use of this function should be replaced with `modify_main_tags()` to
+    set the data from `delete_tags` and `extra_tags`, with `ignore_keys()`
+    for the `delete_keys` parameter and with `add_for_extratags()` for the
+    `extra_keys` parameter.
+
+### Name tags
+
+`set/modify_name_tags()` allow you to define the tags used for naming places. Name tags
+can only be selected by their keys. The import script distinguishes
+between primary and auxiliary names. A primary name is the given name of
+a place. Having a primary name makes a place _named_. This is important
+for main tags that are only included when a name is present. Auxiliary names
+are identifiers like references. They may be searched for but should not
+be included on their own.
+
+The functions take a table with two optional fields `main` and `extra`.
+They take _key match lists_ for primary and auxiliary names respectively.
+A third field `house` can contain tags for names that appear in place of
+house numbers in addresses. This field can only contain complete key names.
+'house tags' are special in that they cause the OSM object to be added to
+the database independently of the presence of other main tags.
+
+`set_name_tags()` overwrites the current configuration, while
+`modify_name_tags()` replaces the fields that are given. (Be aware that
+the fields are replaced as a whole. `main = {'foo_name'}` will cause
+`foo_name` to become the only recognized primary name. Any previously
+defined primary names are forgotten.)
 
 !!! example
     ``` lua
@@ -186,29 +322,33 @@ They take _key match lists_ for main and extra names respectively.
     only include those that have a common name and not those which just
     have some reference ID from the city.
 
-#### `set_address_tags()` - defining address parts
+##### Presets
 
-Address tags will be used to build up the address of an object.
+| Name     | Description |
+| :-----   | :---------- |
+| core     | Basic set of recognized names for all places. |
+| address  | Additional names useful when indexing full addresses. |
+| poi      | Extended set of recognized names for pois. Use on top of the core set. |
 
-`set_address_tags()` takes a table with arbitrary fields pointing to
-_key match lists_. Two fields have a special meaning:
+### Address tags
 
-* __main__: defines
-the tags that make a full address object out of the OSM object. This
-is usually the housenumber or variants thereof. If a main address tag
-appears, then the object will always be included, if necessary with a
-fallback of `place=house`. If the key has a prefix of `addr:` or `is_in:`
-this will be stripped.
+`set/modify_address_tags()` defines the tags that will be used to build
+up the address of an object. Address tags can only be chosen by their key.
 
-* __extra__: defines all supplementary tags for addresses, tags like `addr:street`, `addr:city` etc. If the key has a prefix of `addr:` or `is_in:` this will be stripped.
+The functions take a table with arbitrary fields, each defining
+a key list or _key match list_. Some fields have a special meaning:
 
-All other fields will be handled as summary fields. If a key matches the
-key match list, then its value will be added to the address tags with the
-name of the field as key. If multiple tags match, then an arbitrary one
-wins.
+| Field     | Type      | Description |
+| :---------| :-------- | :-----------|
+| main      | key list  | Tags that make a full address object out of the OSM object. This is usually the house number or variants thereof. If a main address tag appears, then the object will always be included, if necessary with a fallback of `place=house`. If the key has a prefix of `addr:` or `is_in:` this will be stripped. |
+| extra     | key match list | Supplementary tags for addresses, tags like `addr:street`, `addr:city` etc. If the key has a prefix of `addr:` or `is_in:` this will be stripped. |
+| interpolation | key list | Tags that identify address interpolation lines. |
+| country   | key match list | Tags that may contain the country the place is in. The first found value with a two-letter code will be accepted, all other values are discarded. |
+| _other_   | key match list | Summary field. If a key matches the key match list, then its value will be added to the address tags with the name of the field as key. If multiple tags match, then an arbitrary one wins. |
 
-Country tags are handled slightly special. Only tags with a two-letter code
-are accepted, all other values are discarded.
+`set_address_tags()` overwrites the current configuration, while
+`modify_address_tags()` replaces the fields that are given. (Be aware that
+the fields are replaced as a whole.)
 
 !!! example
     ``` lua
@@ -232,21 +372,33 @@ are accepted, all other values are discarded.
     to postcodes, they will always be saved under the key `postcode` thus
     normalizing the multitude of keys that are used in the OSM database.
 
+##### Presets
+
+| Name     | Description |
+| :-----   | :---------- |
+| core     | Basic set of tags needed to recognize address relationship for any place. Always include this. |
+| houses   | Additional set of tags needed to recognize proper addresses |
 
-#### `set_unused_handling()` - processing remaining tags
+### Handling of unclassified tags
 
-This function defines what to do with tags that remain after all tags
+`set_unused_handling()` defines what to do with tags that remain after all tags
 have been classified using the functions above. There are two ways in
 which the function can be used:
 
 `set_unused_handling(delete_keys = ..., delete_tags = ...)` deletes all
 keys that match the descriptions in the parameters and moves all remaining
 tags into the extratags list.
+
 `set_unused_handling(extra_keys = ..., extra_tags = ...)` moves all tags
 matching the parameters into the extratags list and then deletes the remaining
 tags. For the format of the parameters see the description in `set_prefilters()`
 above.
 
+When no special handling is set, then unused tags will be discarded with one
+exception: place tags are kept in extratags for administrative boundaries.
+When using a custom setting, you should also make sure that the place tag
+is added for extratags.
+
 !!! example
     ``` lua
     local flex = require('import-full')
@@ -263,17 +415,23 @@ above.
     already delete the tiger tags with `set_prefilters()` because that
     would remove tiger:county before the address tags are processed.
 
-### Customizing osm2pgsql callbacks
+## Customizing osm2pgsql callbacks
 
 osm2pgsql expects the flex style to implement three callbacks, one process
 function per OSM type. If you want to implement special handling for
 certain OSM types, you can override the default implementations provided
 by the flex-base module.
 
-#### Changing the relation types to be handled
+### Enabling additional relation types
 
-The default scripts only allows relations of type `multipolygon`, `boundary`
-and `waterway`. To add other types relations, set `RELATION_TYPES` for
+OSM relations can represent very diverse
+[types of real-world objects](https://wiki.openstreetmap.org/wiki/Key:type). To
+be able to process them correctly, Nominatim needs to understand how to
+create a geometry for each type. By default, the script knows how to
+process relations of type `multipolygon`, `boundary` and `waterway`. All
+other relation types are ignored.
+
+To add other types of relations, set `RELATION_TYPES` for
 the type to the kind of geometry that should be created. The following
 kinds of geometries can be used:
 
@@ -297,7 +455,7 @@ kinds of geometries can be used:
     geometry.
 
 
-#### Adding additional logic to processing functions
+### Adding additional logic to processing functions
 
 The default processing functions are also exported by the flex-base module
 as `process_node`, `process_way` and `process_relation`. These can be used
@@ -322,110 +480,83 @@ logic.
 
 ### Customizing the main processing function
 
-The main processing function of the flex style can be found in the function
-`process_tags`. This function is called for all OSM object kinds and is
-responsible for filtering the tags and writing out the rows into Postgresql.
+!!! danger "Deprecation Warning"
+    The style used to allow overwriting the internal processing function
+    `process_tags()`. While this is currently still possible, it is no longer
+    encouraged and may stop working in future versions. The internal
+    `Place` class should now be considered read-only.
+
+
+## Using osm2pgsql-themepark
+
+The Nominatim osm2pgsql style is designed so that it can also be used as
+a theme for [osm2pgsql-themepark](https://osm2pgsql.org/themepark/). This
+makes it easy to combine Nominatim with other projects like
+[openstreetmap-carto](https://github.com/gravitystorm/openstreetmap-carto)
+in the same database.
+
+To set up one of the preset styles, simply include a topic with the same name:
+
+```
+local themepark = require('themepark')
+themepark:add_topic('nominatim/address')
+```
+
+Themepark topics offer two configuration options:
+
+* **street_theme** allows you to choose one of the sub topics for streets:
+    * _default_ - include all major streets and named minor paths
+    * _car_ - include all streets physically usable by cars
+    * _all_ - include all major streets and minor paths
+* **with_extratags**, when set to a truthy value, causes tags that are
+  not specifically used for address or naming to be added to the
+  extratags column
+
+The customization functions described in the
+[Changing recognized tags](#changing-the-recognized-tags) section
+are available from the theme. To access the theme you need to explicitly initialize it.
 
 !!! Example
     ``` lua
-    local flex = require('import-full')
+    local themepark = require('themepark')
 
-    local original_process_tags = flex.process_tags
+    themepark:add_topic('nominatim/full', {with_extratags = true})
 
-    function flex.process_tags(o)
-        if o.object.tags.highway ~= nil and o.object.tags.access == 'no' then
-            return
-        end
+    local flex = themepark:init_theme('nominatim')
+
+    flex.modify_main_tags{amenity = {
+                           waste_basket = 'delete'}
+                      }
+    ```
+    This example uses the full Nominatim configuration but disables
+    importing waste baskets.
+
+You may also write a new configuration from scratch. Simply omit including
+a Nominatim topic and only call the required customization functions.
 
-        original_process_tags(o)
+Customizing the osm2pgsql processing functions as explained
+[above](#adding-additional-logic-to-processing-functions) is not possible
+when running under themepark. Instead include other topics that make the
+necessary modifications or add an additional processor before including
+the Nominatim topic.
+
+!!! Example
+    ``` lua
+    local themepark = require('themepark')
+
+    local function discard_country_boundaries(object)
+        if object.tags.boundary == 'administrative' and object.tags.admin_level == '2' then
+            return 'stop'
+        end
     end
+
+    themepark:add_proc('relation', discard_country_boundaries)
+    -- Order matters here. The topic needs to be added after the custom callback.
+    themepark:add_topic('nominatim/full', {with_extratags = true})
     ```
+    Discarding country-level boundaries when running under themepark.
 
-    This example shows the most simple customization of the process_tags function.
-    It simply adds some additional processing before running the original code.
-    To do that, first save the original function and then overwrite process_tags
-    from the module. In this example all highways which are not accessible
-    by anyone will be ignored.
-
-
-#### The `Place` class
-
-The `process_tags` function receives a Lua object of `Place` type which comes
-with some handy functions to collect the data necessary for geocoding and
-writing it into the place table. Always use this object to fill the table.
-
-The Place class has some attributes which you may access read-only:
-
-* __object__ is the original OSM object data handed in by osm2pgsql
-* __admin_level__ is the content of the admin_level tag, parsed into an
-  integer and normalized to a value between 0 and 15
-* __has_name__ is a boolean indicating if the object has a full name
-* __names__ is a table with the collected list of name tags
-* __address__ is a table with the collected list of address tags
-* __extratags__ is a table with the collected list of additional tags to save
-
-There are a number of functions to fill these fields. All functions expect
-a table parameter with fields as indicated in the description.
-Many of these functions expect match functions which are described in detail
-further below.
-
-* __delete{match=...}__ removes all tags that match the match function given
-  in _match_.
-* __grab_extratags{match=...}__ moves all tags that match the match function
-  given in _match_ into extratags. Returns the number of tags moved.
-* __clean{delete=..., extra=...}__ deletes all tags that match _delete_ and
-  moves the ones that match _extra_  into extratags
-* __grab_address_parts{groups=...}__ moves matching tags into the address table.
-  _groups_ must be a group match function. Tags of the group `main` and
-  `extra` are added to the address table as is but with `addr:` and `is_in:`
-  prefixes removed from the tag key. All other groups are added with the
-  group name as key and the value from the tag. Multiple values of the same
-  group overwrite each other. The function returns the number of tags saved
-  from the main group.
-* __grab_main_parts{groups=...}__ moves matching tags into the name table.
-  _groups_ must be a group match function. If a tags of the group `main` is
-  present, the object will be marked as having a name. Tags of group `house`
-  produce a fallback to `place=house`. This fallback is return by the function
-  if present.
-
-There are two functions to write a row into the place table. Both functions
-expect the main tag (key and value) for the row and then use the collected
-information from the name, address, extratags etc. fields to complete the row.
-They also have a boolean parameter `save_extra_mains` which defines how any
-unprocessed tags are handled: when True, the tags will be saved as extratags,
-when False, they will be simply discarded.
-
-* __write_row(key, value, save_extra_mains)__ creates a new table row from
-  the current state of the Place object.
-* __write_place(key, value, mtype, save_extra_mains)__ creates a new row
-  conditionally. When value is nil, the function will attempt to look up the
-  value in the object tags. If value is still nil or mtype is nil, the row
-  is ignored. An mtype of `always` will then always write out the row,
-  a mtype of `named` only, when the object has a full name. When mtype
-  is `named_with_key`, the function checks for a domain name, i.e. a name
-  tag prefixed with the name of the main key. Only if at least one is found,
-  the row will be written. The names are replaced with the domain names found.
-
-#### Match functions
-
-The Place functions usually expect either a _match function_ or a
-_group match function_ to find the tags to apply their function to.
-
-The __match function__ is a Lua function which takes two parameters,
-key and value, and returns a boolean to indicate that a tag matches. The
-flex-base module has a convenience function `tag_match()` to create such a
-function. It takes a table with two optional fields: `keys` takes a key match
-list (see above), `tags` takes a table with keys that point to a list of
-possible values, thus defining key/value matches.
-
-The __group match function__ is a Lua function which also takes two parameters,
-key and value, and returns a string indicating to which group or type they
-belong to. The `tag_group()` can be used to create such a function. It expects
-a table where the group names are the keys and the values are a key match list.
-
-
-
-### Using the gazetteer output of osm2pgsql
+## osm2pgsql gazetteer output
 
 Nominatim still allows you to configure the gazetteer output to remain
 backwards compatible with older imports. It will be automatically used
@@ -435,9 +566,9 @@ of Nominatim. Do not use the gazetteer output for new imports. There is no
 guarantee that new versions of Nominatim are fully compatible with the
 gazetteer output.
 
-### Changing the Style of Existing Databases
+## Changing the style of existing databases
 
-There is normally no issue changing the style of a database that is already
+There is usually no issue changing the style of a database that is already
 imported and now kept up-to-date with change files. Just be aware that any
 change in the style applies to updates only. If you want to change the data
 that is already in the database, then a reimport is necessary.
diff --git a/docs/customize/Settings.md b/docs/customize/Settings.md
index b00d04cf..edf2241b 100644
--- a/docs/customize/Settings.md
+++ b/docs/customize/Settings.md
@@ -336,7 +336,7 @@ NOMINATIM_TABLESPACE_SEARCH_INDEX
 NOMINATIM_TABLESPACE_OSM_DATA
 :    Raw OSM data cache used for import and updates.
 
-NOMINATIM_TABLESPACE_OSM_DATA
+NOMINATIM_TABLESPACE_OSM_INDEX
 :    Indexes on the raw OSM data cache.
 
 NOMINATIM_TABLESPACE_PLACE_DATA
@@ -602,6 +602,43 @@ results gathered so far.
 Note that under high load you may observe that users receive different results
 than usual without seeing an error. This may cause some confusion.
 
+#### NOMINATIM_OUTPUT_NAMES
+
+| Summary            |                                                     |
+| --------------     | --------------------------------------------------- |
+| **Description:**   | Specifies order of name tags |
+| **Format:**        | string: comma-separated list of tag names |
+| **Default:**       | name:XX,name,brand,official_name:XX,short_name:XX,official_name,short_name,ref |
+
+Specifies the order in which different name tags are used.
+The values in this list determine the preferred order of name variants,
+including language-specific names (in OSM: the name tag with and without any language suffix).
+
+Comma-separated list, where :XX stands for language suffix
+(e.g. name:en) and no :XX stands for general tags (e.g. name).
+
+See also [NOMINATIM_DEFAULT_LANGUAGE](#nominatim_default_language).
+
+!!! note
+    If NOMINATIM_OUTPUT_NAMES = `name:XX,name,short_name:XX,short_name` the search follows
+
+        ```
+        'name', 'short_name'
+        ```
+
+    if we have no preferred language order for showing search results.
+
+    For languages ['en', 'es'] the search follows
+
+        ```
+        'name:en', 'name:es',
+        'name',
+        'short_name:en', 'short_name:es',
+        'short_name'
+        ```
+
+    For those familiar with the internal implementation, the `_place_*` expansion is added, but to simplify, it is not included in this example.
+
 ### Logging Settings
 
 #### NOMINATIM_LOG_DB
diff --git a/docs/customize/Special-Phrases.md b/docs/customize/Special-Phrases.md
index 4824512b..3ab837f2 100644
--- a/docs/customize/Special-Phrases.md
+++ b/docs/customize/Special-Phrases.md
@@ -17,7 +17,7 @@ columns:
 
  * **phrase**: the keyword to look for
  * **class**: key of the main tag of the place to find
-   (see [principal tags in import style](Import-Styles.md#set_main_tags-principal-tags)
+   (see [Import styles](Import-Styles.md#how-processing-works))
  * **type**: value of the main tag
  * **operator**: type of special phrase, may be one of:
      * *in*: place is within the place defined by the search term (e.g. "_Hotels in_ Berlin")
diff --git a/docs/customize/Tokenizers.md b/docs/customize/Tokenizers.md
index 30be170e..23db34c9 100644
--- a/docs/customize/Tokenizers.md
+++ b/docs/customize/Tokenizers.md
@@ -4,12 +4,11 @@ The tokenizer module in Nominatim is responsible for analysing the names given
 to OSM objects and the terms of an incoming query in order to make sure, they
 can be matched appropriately.
 
-Nominatim offers different tokenizer modules, which behave differently and have
-different configuration options. This sections describes the tokenizers and how
-they can be configured.
+Nominatim currently offers only one tokenizer module, the ICU tokenizer. This section
+describes the tokenizer and how it can be configured.
 
 !!! important
-    The use of a tokenizer is tied to a database installation. You need to choose
+    The selection of tokenizer is tied to a database installation. You need to choose
     and configure the tokenizer before starting the initial import. Once the import
     is done, you cannot switch to another tokenizer anymore. Reconfiguring the
     chosen tokenizer is very limited as well. See the comments in each tokenizer
@@ -43,10 +42,19 @@ On import the tokenizer processes names in the following three stages:
    See the [Token analysis](#token-analysis) section below for more
    information.
 
-During query time, only normalization and transliteration are relevant.
-An incoming query is first split into name chunks (this usually means splitting
-the string at the commas) and the each part is normalised and transliterated.
-The result is used to look up places in the search index.
+During query time, the tokenizer is responsible for processing incoming
+queries. This happens in two stages:
+
+1. During **query preprocessing** the incoming text is split into name
+   chunks and normalised. This usually means applying the same normalisation
+   as during the import process but may involve other processing like,
+   for example, word break detection.
+2. The **token analysis** step breaks down the query parts into tokens,
+   looks them up in the database and assigns them possible functions and
+   probabilities.
+
+Query processing can be further customized while the rest of the analysis
+is hard-coded.
 
 ### Configuration
 
@@ -58,6 +66,14 @@ have no effect.
 Here is an example configuration file:
 
 ``` yaml
+query-preprocessing:
+    - step: split_japanese_phrases
+    - step: regex_replace
+      replacements:
+        - pattern: https?://[^\s]* # Filter URLs starting with http or https
+          replace: ''
+    - step: normalize
+
 normalization:
     - ":: lower ()"
     - "ß > 'ss'" # German szet is unambiguously equal to double ss
@@ -78,8 +94,37 @@ token-analysis:
             replacements: ['ä', 'ae']
 ```
 
-The configuration file contains four sections:
-`normalization`, `transliteration`, `sanitizers` and `token-analysis`.
+The configuration file contains five sections:
+`query-preprocessing`, `normalization`, `transliteration`, `sanitizers` and `token-analysis`.
+
+#### Query preprocessing
+
+The section for `query-preprocessing` defines an ordered list of functions
+that are applied to the query before the token analysis.
+
+The following is a list of preprocessors that are shipped with Nominatim.
+
+##### normalize
+
+::: nominatim_api.query_preprocessing.normalize
+    options:
+        members: False
+        heading_level: 6
+        docstring_section_style: spacy
+
+##### regex-replace
+
+::: nominatim_api.query_preprocessing.regex_replace
+    options:
+        members: False
+        heading_level: 6
+        docstring_section_style: spacy
+    description: 
+        This option runs any given regex pattern on the input and replaces values accordingly
+    replacements:
+        - pattern: regex pattern
+          replace: string to replace with
+
 
 #### Normalization and Transliteration
 
diff --git a/docs/develop/Development-Environment.md b/docs/develop/Development-Environment.md
index a6558c7d..5f247455 100644
--- a/docs/develop/Development-Environment.md
+++ b/docs/develop/Development-Environment.md
@@ -25,15 +25,15 @@ following packages should get you started:
 
 ## Prerequisites for testing and documentation
 
-The Nominatim test suite consists of behavioural tests (using behave) and
+The Nominatim test suite consists of behavioural tests (using pytest-bdd) and
 unit tests (using pytest). It has the following additional requirements:
 
-* [behave test framework](https://behave.readthedocs.io) >= 1.2.6
 * [flake8](https://flake8.pycqa.org/en/stable/) (CI always runs the latest version from pip)
 * [mypy](http://mypy-lang.org/) (plus typing information for external libs)
 * [Python Typing Extensions](https://github.com/python/typing_extensions) (for Python < 3.9)
 * [pytest](https://pytest.org)
 * [pytest-asyncio](https://pytest-asyncio.readthedocs.io)
+* [pytest-bdd](https://pytest-bdd.readthedocs.io)
 
 For testing the Python search frontend, you need to install extra dependencies
 depending on your choice of webserver framework:
@@ -48,9 +48,6 @@ The documentation is built with mkdocs:
 * [mkdocs-material](https://squidfunk.github.io/mkdocs-material/)
 * [mkdocs-gen-files](https://oprypin.github.io/mkdocs-gen-files/)
 
-Please be aware that tests always run against the globally installed
-osm2pgsql, so you need to have this set up. If you want to test against
-the vendored version of osm2pgsql, you need to set the PATH accordingly.
 
 ### Installing prerequisites on Ubuntu/Debian
 
@@ -59,7 +56,9 @@ The easiest way, to handle these Python dependencies is to run your
 development from within a virtual environment.
 
 ```sh
-sudo apt install libsqlite3-mod-spatialite
+sudo apt install libsqlite3-mod-spatialite osm2pgsql \
+                 postgresql-postgis postgresql-postgis-scripts \
+                 pkg-config libicu-dev virtualenv
 ```
 
 To set up the virtual environment with all necessary packages run:
@@ -67,9 +66,10 @@ To set up the virtual environment with all necessary packages run:
 ```sh
 virtualenv ~/nominatim-dev-venv
 ~/nominatim-dev-venv/bin/pip install\
-    psutil psycopg[binary] PyICU SQLAlchemy \
-    python-dotenv jinja2 pyYAML datrie behave \
-    mkdocs mkdocstrings mkdocs-gen-files pytest pytest-asyncio flake8 \
+    psutil 'psycopg[binary]' PyICU SQLAlchemy \
+    python-dotenv jinja2 pyYAML \
+    mkdocs 'mkdocstrings[python]' mkdocs-gen-files \
+    pytest pytest-asyncio pytest-bdd flake8 \
     types-jinja2 types-markupsafe types-psutil types-psycopg2 \
     types-pygments types-pyyaml types-requests types-ujson \
     types-urllib3 typing-extensions unicorn falcon starlette \
diff --git a/docs/develop/ICU-Tokenizer-Modules.md b/docs/develop/ICU-Tokenizer-Modules.md
index d189422a..30b85ac7 100644
--- a/docs/develop/ICU-Tokenizer-Modules.md
+++ b/docs/develop/ICU-Tokenizer-Modules.md
@@ -14,10 +14,11 @@ of sanitizers and token analysis.
     implemented, it is not guaranteed to be stable at the moment.
 
 
-## Using non-standard sanitizers and token analyzers
+## Using non-standard modules
 
-Sanitizer names (in the `step` property) and token analysis names (in the
-`analyzer`) may refer to externally supplied modules. There are two ways
+Sanitizer names (in the `step` property), token analysis names (in the
+`analyzer`) and query preprocessor names (in the `step` property)
+may refer to externally supplied modules. There are two ways
 to include external modules: through a library or from the project directory.
 
 To include a module from a library, use the absolute import path as name and
@@ -27,6 +28,53 @@ To use a custom module without creating a library, you can put the module
 somewhere in your project directory and then use the relative path to the
 file. Include the whole name of the file including the `.py` ending.
 
+## Custom query preprocessors
+
+A query preprocessor must export a single factory function `create` with
+the following signature:
+
+``` python
+def create(config: QueryConfig) -> Callable[[list[Phrase]], list[Phrase]]
+```
+
+The function receives the custom configuration for the preprocessor and
+returns a callable (function or class) with the actual preprocessing
+code. When a query comes in, then the callable gets a list of phrases
+and needs to return the transformed list of phrases. The list and phrases
+may be changed in place or a completely new list may be generated.
+
+The `QueryConfig` is a simple dictionary which contains all configuration
+options given in the yaml configuration of the ICU tokenizer. It is up to
+the function to interpret the values.
+
+A `nominatim_api.search.Phrase` describes a part of the query that contains one or more independent
+search terms. Breaking a query into phrases helps reduce the number of
+possible tokens Nominatim has to take into account. However, a phrase break
+is definitive: a multi-term search word cannot go over a phrase break.
+A Phrase object has two fields:
+
+ * `ptype` further refines the type of phrase (see list below)
+ * `text` contains the query text for the phrase
+
+The order of phrases matters to Nominatim when doing further processing.
+Thus, while you may split or join phrases, you should not reorder them
+unless you really know what you are doing.
+
+Phrase types can further help narrow down how the tokens in the phrase
+are interpreted. The following phrase types are known:
+
+| Name           | Description |
+|----------------|-------------|
+| PHRASE_ANY     | No specific designation (i.e. source is free-form query) |
+| PHRASE_AMENITY | Contains name or type of a POI |
+| PHRASE_STREET  | Contains a street name optionally with a housenumber |
+| PHRASE_CITY    | Contains the postal city |
+| PHRASE_COUNTY  | Contains the equivalent of a county |
+| PHRASE_STATE   | Contains a state or province |
+| PHRASE_POSTCODE| Contains a postal code |
+| PHRASE_COUNTRY | Contains the country name or code |
+
+
 ## Custom sanitizer modules
 
 A sanitizer module must export a single factory function `create` with the
@@ -90,21 +138,22 @@ adding extra attributes) or completely replace the list with a different one.
 The following sanitizer removes the directional prefixes from street names
 in the US:
 
-``` python
-import re
-
-def _filter_function(obj):
-    if obj.place.country_code == 'us' \
-       and obj.place.rank_address >= 26 and obj.place.rank_address <= 27:
-        for name in obj.names:
-            name.name = re.sub(r'^(north|south|west|east) ',
-                               '',
-                               name.name,
-                               flags=re.IGNORECASE)
-
-def create(config):
-    return _filter_function
-```
+!!! example
+    ``` python
+    import re
+
+    def _filter_function(obj):
+        if obj.place.country_code == 'us' \
+           and obj.place.rank_address >= 26 and obj.place.rank_address <= 27:
+            for name in obj.names:
+                name.name = re.sub(r'^(north|south|west|east) ',
+                                   '',
+                                   name.name,
+                                   flags=re.IGNORECASE)
+
+    def create(config):
+        return _filter_function
+    ```
 
 This is the most simple form of a sanitizer module. If defines a single
 filter function and implements the required `create()` function by returning
@@ -128,13 +177,13 @@ sanitizers:
 
 !!! warning
     This example is just a simplified show case on how to create a sanitizer.
-    It is not really read for real-world use: while the sanitizer would
+    It is not really meant for real-world use: while the sanitizer would
     correctly transform `West 5th Street` into `5th Street`. it would also
     shorten a simple `North Street` to `Street`.
 
 For more sanitizer examples, have a look at the sanitizers provided by Nominatim.
 They can be found in the directory
-[`nominatim/tokenizer/sanitizers`](https://github.com/osm-search/Nominatim/tree/master/nominatim/tokenizer/sanitizers).
+[`src/nominatim_db/tokenizer/sanitizers`](https://github.com/osm-search/Nominatim/tree/master/src/nominatim_db/tokenizer/sanitizers).
 
 
 ## Custom token analysis module
diff --git a/docs/develop/Testing.md b/docs/develop/Testing.md
index 12673d40..738fa4b8 100644
--- a/docs/develop/Testing.md
+++ b/docs/develop/Testing.md
@@ -43,53 +43,53 @@ The name of the pytest binary depends on your installation.
 ## BDD Functional Tests (`test/bdd`)
 
 Functional tests are written as BDD instructions. For more information on
-the philosophy of BDD testing, see the
-[Behave manual](http://pythonhosted.org/behave/philosophy.html).
-
-The following explanation assume that the reader is familiar with the BDD
-notations of features, scenarios and steps.
-
-All possible steps can be found in the `steps` directory and should ideally
-be documented.
+the philosophy of BDD testing, read the Wikipedia article on
+[Behaviour-driven development](https://en.wikipedia.org/wiki/Behavior-driven_development).
 
 ### General Usage
 
 To run the functional tests, do
 
-    cd test/bdd
-    behave
-
-The tests can be configured with a set of environment variables (`behave -D key=val`):
-
- * `TEMPLATE_DB` - name of template database used as a skeleton for
-                   the test databases (db tests)
- * `TEST_DB` - name of test database (db tests)
- * `API_TEST_DB` - name of the database containing the API test data (api tests)
- * `API_TEST_FILE` - OSM file to be imported into the API test database (api tests)
- * `API_ENGINE` - webframe to use for running search queries, same values as
-                  `nominatim serve --engine` parameter
- * `DB_HOST` - (optional) hostname of database host
- * `DB_PORT` - (optional) port of database on host
- * `DB_USER` - (optional) username of database login
- * `DB_PASS` - (optional) password for database login
- * `REMOVE_TEMPLATE` - if true, the template and API database will not be reused
-                       during the next run. Reusing the base templates speeds
-                       up tests considerably but might lead to outdated errors
-                       for some changes in the database layout.
- * `KEEP_TEST_DB` - if true, the test database will not be dropped after a test
-                    is finished. Should only be used if one single scenario is
-                    run, otherwise the result is undefined.
-
-Logging can be defined through command line parameters of behave itself. Check
-out `behave --help` for details. Also have a look at the 'work-in-progress'
-feature of behave which comes in handy when writing new tests.
+    pytest test/bdd
+
+The BDD tests create databases for the tests. You can set the names of the databases
+through configuration variables in your `pytest.ini`:
+
+ * `nominatim_test_db` defines the name of the temporary database created for
+    a single test (default: `test_nominatim`)
+ * `nominatim_api_test_db` defines the name of the database containing
+    the API test data, see also below (default: `test_api_nominatim`)
+ * `nominatim_template_db` defines the name of the template database used
+    for creating the temporary test databases. It contains some static setup
+    which usually doesn't change between imports of OSM data
+    (default: `test_template_nominatim`)
+
+To change other connection parameters for the PostgreSQL database, use
+the [libpq environment variables](https://www.postgresql.org/docs/current/libpq-envars.html).
+Never set a password through these variables. Use a
+[password file](https://www.postgresql.org/docs/current/libpq-pgpass.html) instead.
+
+The API test database and the template database are only created once and then
+left untouched. This is usually what you want because it speeds up subsequent
+runs of BDD tests. If you do change code that has an influence on the content
+of these databases, you can run pytest with the `--nominatim-purge` parameter
+and the databases will be dropped and recreated from scratch.
+
+When running the BDD tests with make (using `make tests` or `make bdd`), then
+the databases will always be purged.
+
+The temporary test database is usually dropped directly after the test, so
+it does not take up unnecessary space. If you want to keep the database around,
+for example while debugging a specific BDD test, use the parameter
+`--nominatim-keep-db`.
+
 
 ### API Tests (`test/bdd/api`)
 
 These tests are meant to test the different API endpoints and their parameters.
 They require to import several datasets into a test database. This is normally
 done automatically during setup of the test. The API test database is then
-kept around and reused in subsequent runs of behave. Use `behave -DREMOVE_TEMPLATE`
+kept around and reused in subsequent runs of pytest. Use `--nominatim-purge`
 to force a reimport of the database.
 
 The official test dataset is saved in the file `test/testdb/apidb-test-data.pbf`
@@ -109,12 +109,12 @@ test the correctness of osm2pgsql. Each test will write some data into the `plac
 table (and optionally the `planet_osm_*` tables if required) and then run
 Nominatim's processing functions on that.
 
-These tests need to create their own test databases. By default they will be
-called `test_template_nominatim` and `test_nominatim`. Names can be changed with
-the environment variables `TEMPLATE_DB` and `TEST_DB`. The user running the tests
-needs superuser rights for postgres.
+These tests use the template database and create temporary test databases for
+each test.
 
 ### Import Tests (`test/bdd/osm2pgsql`)
 
-These tests check that data is imported correctly into the place table. They
-use the same template database as the DB Creation tests, so the same remarks apply.
+These tests check that data is imported correctly into the place table.
+
+These tests also use the template database and create temporary test databases
+for each test.
diff --git a/docs/develop/Tokenizers.md b/docs/develop/Tokenizers.md
index f4a55adc..a1dae78b 100644
--- a/docs/develop/Tokenizers.md
+++ b/docs/develop/Tokenizers.md
@@ -91,14 +91,19 @@ for a custom tokenizer implementation.
 
 ### Directory Structure
 
-Nominatim expects a single file `src/nominatim_db/tokenizer/<NAME>_tokenizer.py`
-containing the Python part of the implementation.
+Nominatim expects two files containing the Python part of the implementation:
+
+ * `src/nominatim_db/tokenizer/<NAME>_tokenizer.py` contains the tokenizer
+   code used during import and
+ * `src/nominatim_api/search/<NAME>_tokenizer.py` has the code used during
+   query time.
+
 `<NAME>` is a unique name for the tokenizer consisting of only lower-case
 letters, digits and underscore. A tokenizer also needs to install some SQL
 functions. By convention, these should be placed in `lib-sql/tokenizer`.
 
 If the tokenizer has a default configuration file, this should be saved in
-the `settings/<NAME>_tokenizer.<SUFFIX>`.
+`settings/<NAME>_tokenizer.<SUFFIX>`.
 
 ### Configuration and Persistence
 
@@ -110,9 +115,11 @@ are tied to a database installation and must only be read during installation
 time. If they are needed for the runtime then they must be saved into the
 `nominatim_properties` table and later loaded from there.
 
-### The Python module
+### The Python modules
 
-The Python module is expect to export a single factory function:
+#### `src/nominatim_db/tokenizer/`
+
+The import Python module is expected to export a single factory function:
 
 ```python
 def create(dsn: str, data_dir: Path) -> AbstractTokenizer
@@ -123,6 +130,20 @@ is a directory in the project directory that the tokenizer may use to save
 database-specific data. The function must return the instance of the tokenizer
 class as defined below.
 
+#### `src/nominatim_api/search/`
+
+The query-time Python module must also export a factory function:
+
+``` python
+def create_query_analyzer(conn: SearchConnection) -> AbstractQueryAnalyzer
+```
+
+The `conn` parameter contains the current search connection. See the
+[library documentation](../library/Low-Level-DB-Access.md#searchconnection-class)
+for details on the class. The function must return an instance of the query
+analyzer class as defined below.
+
+
 ### Python Tokenizer Class
 
 All tokenizers must inherit from `nominatim_db.tokenizer.base.AbstractTokenizer`
@@ -138,6 +159,13 @@ and implement the abstract functions defined there.
     options:
         heading_level: 6
 
+
+### Python Query Analyzer Class
+
+::: nominatim_api.search.query_analyzer_factory.AbstractQueryAnalyzer
+    options:
+        heading_level: 6
+
 ### PL/pgSQL Functions
 
 The tokenizer must provide access functions for the `token_info` column
diff --git a/docs/extra.css b/docs/extra.css
index 1decc478..033e9903 100644
--- a/docs/extra.css
+++ b/docs/extra.css
@@ -2,8 +2,8 @@
     display: none!important
 }
 
-.wy-nav-content {
-    max-width: 900px!important
+.md-content {
+    max-width: 800px
 }
 
 table {
diff --git a/lib-lua/flex-base.lua b/lib-lua/flex-base.lua
new file mode 100644
index 00000000..1173c53f
--- /dev/null
+++ b/lib-lua/flex-base.lua
@@ -0,0 +1,14 @@
+-- This is just an alias for the Nominatim themepark theme module
+local flex = require('themes/nominatim/init')
+
+function flex.load_topic(name, cfg)
+    -- Run topic `name` from themes/nominatim/topics/ next to this file, passing (nil, flex, cfg or {}).
+    local topic_file = debug.getinfo(1, "S").source:sub(2):match("(.*/)") .. 'themes/nominatim/topics/'.. name .. '.lua'
+    local topic, err = loadfile(topic_file)  -- nil plus a message if the file is missing or does not compile
+    if topic == nil then
+        error('Cannot find topic: ' .. name .. ' (' .. tostring(err) .. ')')
+    end
+    topic(nil, flex, cfg or {})
+end
+
+return flex
diff --git a/lib-lua/import-address.lua b/lib-lua/import-address.lua
new file mode 100644
index 00000000..bec21505
--- /dev/null
+++ b/lib-lua/import-address.lua
@@ -0,0 +1,6 @@
+-- This is just an alias for the Nominatim themepark address topic
+local flex = require('flex-base')
+
+flex.load_topic('address')
+
+return flex
diff --git a/lib-lua/import-admin.lua b/lib-lua/import-admin.lua
new file mode 100644
index 00000000..8d1230a1
--- /dev/null
+++ b/lib-lua/import-admin.lua
@@ -0,0 +1,6 @@
+-- This is just an alias for the Nominatim themepark admin topic
+local flex = require('flex-base')
+
+flex.load_topic('admin')
+
+return flex
diff --git a/lib-lua/import-extratags.lua b/lib-lua/import-extratags.lua
new file mode 100644
index 00000000..53b1c81e
--- /dev/null
+++ b/lib-lua/import-extratags.lua
@@ -0,0 +1,6 @@
+-- This is just an alias for the Nominatim themepark full topic with extratags
+local flex = require('flex-base')
+
+flex.load_topic('full', {with_extratags = true})
+
+return flex
diff --git a/lib-lua/import-full.lua b/lib-lua/import-full.lua
new file mode 100644
index 00000000..59308a67
--- /dev/null
+++ b/lib-lua/import-full.lua
@@ -0,0 +1,6 @@
+-- This is just an alias for the Nominatim themepark full topic
+local flex = require('flex-base')
+
+flex.load_topic('full')
+
+return flex
diff --git a/lib-lua/import-street.lua b/lib-lua/import-street.lua
new file mode 100644
index 00000000..1a02b098
--- /dev/null
+++ b/lib-lua/import-street.lua
@@ -0,0 +1,6 @@
+-- This is just an alias for the Nominatim themepark street topic
+local flex = require('flex-base')
+
+flex.load_topic('street')
+
+return flex
diff --git a/lib-lua/taginfo.lua b/lib-lua/taginfo.lua
new file mode 100644
index 00000000..402499ad
--- /dev/null
+++ b/lib-lua/taginfo.lua
@@ -0,0 +1,118 @@
+-- Prints taginfo project description in the standard output
+--
+
+-- create fake "osm2pgsql" table for flex-base, originally created by the main C++ program
+osm2pgsql = {}
+function osm2pgsql.define_table(...) end
+
+-- provide path to flex-style lua file ('./' when arg[0] has no directory part, e.g. `lua taginfo.lua`)
+package.path = (arg[0]:match("(.*/)") or "./") .. "?.lua;" .. package.path
+local flex = require('import-' .. (arg[1] or 'extratags'))
+local json = require ('dkjson')
+
+local NAME_DESCRIPTIONS = {
+    'Searchable auxiliary name of the place',
+    main = 'Searchable primary name of the place',
+    house = 'House name part of an address, searchable'
+}
+local ADDRESS_DESCRIPTIONS = {
+    'Used to determine the address of a place',
+    main = 'Primary key for an address point',
+    postcode = 'Used to determine the postcode of a place',
+    country = 'Used to determine country of a place (only if written as two-letter code)',
+    interpolation = 'Primary key for an address interpolation line'
+}
+
+------------ helper functions ---------------------
+-- Sets the key order for the resulting JSON table
+local function set_keyorder(table, order)
+    setmetatable(table, {
+        __jsonorder = order
+    })
+end
+
+local function get_key_description(key, description)
+    local desc = {}
+    desc.key = key
+    desc.description = description
+    set_keyorder(desc, {'key', 'description'})
+    return desc
+end
+
+local function get_key_value_description(key, value, description)
+    local desc = {key = key, value = value, description = description}
+    set_keyorder(desc, {'key', 'value', 'description'})
+    return desc
+end
+
+local function group_table_to_keys(tags, data, descriptions)  -- append one key description per plain key in data to tags
+    for group, values in pairs(data) do
+        local desc = descriptions[group] or descriptions[1]  -- group-specific text, else the generic one at [1]
+        for _, key in pairs(values) do
+            if key:sub(1, 1) ~= '*' and key:sub(#key, #key) ~= '*' then  -- skip keys starting or ending with '*'
+                table.insert(tags, get_key_description(key, desc))
+            end
+        end
+    end
+end
+
+-- Prints the collected tags in the required format in JSON
+local function print_taginfo()
+    local taginfo = flex.get_taginfo()
+    local tags = {}
+
+    for k, values in pairs(taginfo.main) do
+        if values[1] == nil or values[1] == 'delete' or values[1] == 'extra' then
+            for v, group in pairs(values) do
+                if type(v) == 'string' and group ~= 'delete' and group ~= 'extra' then
+                    local text = 'POI/feature in the search database'
+                    if type(group) ~= 'function' then
+                        text = 'Fallback ' .. text
+                    end
+                    table.insert(tags, get_key_value_description(k, v, text))
+                end
+            end
+        elseif type(values[1]) == 'function' or values[1] == 'fallback' then
+            local desc = 'POI/feature in the search database'
+            if values[1] == 'fallback' then
+                desc = 'Fallback ' .. desc
+            end
+            local excp = {}
+            for v, group in pairs(values) do
+                if group == 'delete' or group == 'extra' then
+                    table.insert(excp, v)
+                end
+            end
+            if next(excp) ~= nil then
+                desc = desc .. string.format(' (except for values: %s)',
+                                             table.concat(excp, ', '))
+            end
+            table.insert(tags, get_key_description(k, desc))
+        end
+    end
+
+    group_table_to_keys(tags, taginfo.name, NAME_DESCRIPTIONS)
+    group_table_to_keys(tags, taginfo.address, ADDRESS_DESCRIPTIONS)
+
+    local format = {
+        data_format = 1,
+        data_url = 'https://nominatim.openstreetmap.org/taginfo.json',
+        project = {
+            name = 'Nominatim',
+            description = 'OSM search engine.',
+            project_url = 'https://nominatim.openstreetmap.org',
+            doc_url = 'https://nominatim.org/release-docs/develop/',
+            contact_name = 'Sarah Hoffmann',
+            contact_email = 'lonvia@denofr.de'
+        }
+    }
+    format.tags = tags
+
+    set_keyorder(format, {'data_format', 'data_url', 'project', 'tags'})
+    set_keyorder(format.project, {'name', 'description', 'project_url', 'doc_url',
+                    'contact_name', 'contact_email'})
+
+    print(json.encode(format))
+end
+
+print_taginfo()
diff --git a/lib-lua/themes/nominatim/init.lua b/lib-lua/themes/nominatim/init.lua
new file mode 100644
index 00000000..fef86f91
--- /dev/null
+++ b/lib-lua/themes/nominatim/init.lua
@@ -0,0 +1,925 @@
+-- Nominatim themepark theme.
+--
+-- The Nominatim theme creates a fixed set of import tables for use with
+-- Nominatim. Creation and object processing are directly controlled by
+-- the theme. Topics provide preset configurations. You should add exactly
+-- one topic to your project.
+--
+-- The theme also exports a number of functions that can be used to configure
+-- its behaviour. These may be directly called in the style file after
+-- importing the theme:
+--
+--      local nominatim = themepark:init_theme('nominatim')
+--      nominatim.set_main_tags{boundary = 'always'}
+--
+-- This allows you to write your own configuration from scratch. You can also
+-- use it to customize topics. In that case, first add the topic, then
+-- change the configuration:
+--
+--      themepark:add_topic('nominatim/full')
+--      local nominatim = themepark:init_theme('nominatim')
+--      nominatim.ignore_tags{'amenity'}
+
+local module = {}
+
+local MAIN_KEYS = {admin_level = {'delete'}}
+local PRE_FILTER = {prefix = {}, suffix = {}}
+local NAMES = {}
+local NAME_FILTER = nil
+local ADDRESS_TAGS = {}
+local ADDRESS_FILTER = nil
+local EXTRATAGS_FILTER
+local POSTCODE_FALLBACK = true
+
+-- This file can also be directly require'd instead of running it under
+-- the themepark framework. In that case the first parameter is usually
+-- the module name. Let's check for that, so that further down we can call
+-- the low-level osm2pgsql functions instead of themepark functions.
+local themepark = ...
+if type(themepark) ~= 'table' then
+    themepark = nil
+end
+
+-- The single place table.
+local place_table_definition = {
+    name = "place",
+    ids = { type = 'any', id_column = 'osm_id', type_column = 'osm_type' },
+    columns = {
+        { column = 'class', type = 'text', not_null = true },
+        { column = 'type', type = 'text', not_null = true },
+        { column = 'admin_level', type = 'smallint' },
+        { column = 'name', type = 'hstore' },
+        { column = 'address', type = 'hstore' },
+        { column = 'extratags', type = 'hstore' },
+        { column = 'geometry', type = 'geometry', projection = 'WGS84', not_null = true },
+    },
+    data_tablespace = os.getenv("NOMINATIM_TABLESPACE_PLACE_DATA"),
+    index_tablespace = os.getenv("NOMINATIM_TABLESPACE_PLACE_INDEX"),
+    indexes = {}
+}
+
+local insert_row
+local script_path = debug.getinfo(1, "S").source:match("@?(.*/)")
+local PRESETS = loadfile(script_path .. 'presets.lua')()
+
+if themepark then
+    themepark:add_table(place_table_definition)
+    insert_row = function(columns)
+        themepark:insert('place', columns, {}, {})
+    end
+else
+    local place_table = osm2pgsql.define_table(place_table_definition)
+    insert_row = function(columns)
+        place_table:insert(columns)
+    end
+end
+
+------------ Geometry functions for relations ---------------------
+
+function module.relation_as_multipolygon(o)
+    return o:as_multipolygon()
+end
+
+function module.relation_as_multiline(o)
+    return o:as_multilinestring():line_merge()
+end
+
+
+module.RELATION_TYPES = {
+    multipolygon = module.relation_as_multipolygon,
+    boundary = module.relation_as_multipolygon,
+    waterway = module.relation_as_multiline
+}
+
+--------- Built-in place transformation functions --------------------------
+
+local PlaceTransform = {}
+
+-- Special transform meanings which are interpreted elsewhere
+PlaceTransform.fallback = 'fallback'
+PlaceTransform.delete = 'delete'
+PlaceTransform.extra = 'extra'
+
+-- always: unconditionally use that place
+function PlaceTransform.always(place)
+    return place
+end
+
+-- never: unconditionally drop the place
+function PlaceTransform.never()
+    return nil
+end
+
+-- named: use the place if it has a fully-qualified name
+function PlaceTransform.named(place)
+    if place.has_name then
+        return place
+    end
+end
+
+-- named_with_key: use place if there is a name with the main key prefix
+function PlaceTransform.named_with_key(place, k)
+    local names = {}
+    local prefix = k .. ':name'
+    for namek, namev in pairs(place.intags) do
+        if namek:sub(1, #prefix) == prefix  -- tag key starts with '<k>:name' ...
+           and (#namek == #prefix  -- ... and is either exactly that
+                or namek:sub(#prefix + 1, #prefix + 1) == ':') then  -- ... or continues with ':'
+            names[namek:sub(#k + 2)] = namev  -- drop the leading '<k>:' so the stored key starts with 'name'
+        end
+    end
+
+    if next(names) ~= nil then  -- at least one matching name was collected
+        return place:clone{names=names}
+    end
+end  -- without a matching name nothing (nil) is returned
+
+-- Special transform used with address fallbacks: ignore all names
+-- except for those marked as being part of the address.
+local function address_fallback(place)
+    if next(place.names) == nil or NAMES.house == nil then
+        return place
+    end
+
+    local names = {}
+    for k, v in pairs(place.names) do
+        if NAME_FILTER(k, v) == 'house' then
+            names[k] = v
+        end
+    end
+    return place:clone{names=names}
+end
+
+--------- Built-in extratags transformation functions ---------------
+
+local function default_extratags_filter(p, k)
+    -- Default handling is to copy over place tag for boundaries.
+    -- Nominatim needs this.
+    if k ~= 'boundary' or p.intags.place == nil then
+        return p.extratags
+    end
+
+    local extra = { place = p.intags.place }
+    for kin, vin in pairs(p.extratags) do
+        extra[kin] = vin
+    end
+
+    return extra
+end
+EXTRATAGS_FILTER = default_extratags_filter
+
+----------------- other helper functions -----------------------------
+
+local function lookup_prefilter_classification(k, v)
+    -- Returns the group for tag k=v or nil. Full matches in MAIN_KEYS are tried first.
+    local desc = MAIN_KEYS[k]
+    local fullmatch = desc and (desc[v] or desc[1])  -- entry for this value, else the key-wide entry at [1]
+    if fullmatch ~= nil then
+        return fullmatch
+    end
+    -- suffixes: PRE_FILTER.suffix maps a suffix length to a table of suffix -> group
+    for slen, slist in pairs(PRE_FILTER.suffix) do
+        if #k >= slen then
+            local group = slist[k:sub(-slen)]  -- last slen characters of the key
+            if group ~= nil then
+                return group
+            end
+        end
+    end
+    -- prefixes: PRE_FILTER.prefix maps a prefix length to a table of prefix -> group
+    for slen, slist in pairs(PRE_FILTER.prefix) do
+        if #k >= slen then
+            local group = slist[k:sub(1, slen)]  -- first slen characters of the key
+            if group ~= nil then
+                return group
+            end
+        end
+    end
+end
+
+
+local function merge_filters_into_main(group, keys, tags)  -- record 'group' in MAIN_KEYS for the given keys and tags
+    if keys ~= nil then  -- keys: list of key names
+        for _, key in pairs(keys) do
+            -- ignore suffix and prefix matches (keys starting or ending with '*')
+            if key:sub(1, 1) ~= '*' and key:sub(#key, #key) ~= '*' then
+                if MAIN_KEYS[key] == nil then
+                    MAIN_KEYS[key] = {}
+                end
+                MAIN_KEYS[key][1] = group  -- index 1 holds the key-wide group
+            end
+        end
+    end
+
+    if tags ~= nil then  -- tags: table of key -> list of values
+        for key, values in pairs(tags) do
+            if MAIN_KEYS[key] == nil then
+                MAIN_KEYS[key] = {}
+            end
+            for _, v in pairs(values) do
+                MAIN_KEYS[key][v] = group  -- group applies to this key/value pair only
+            end
+        end
+    end
+end
+
+
+-- Intended to remove the entries assigned to `group` from MAIN_KEYS and
+-- to drop keys that are left without any entry.
+-- NOTE(review): the inner loop clears values[ttype], i.e. it indexes the
+-- table with the group name instead of the key under which the group is
+-- stored. Entries like values[1] = group or values['no'] = group are
+-- therefore left in place. modify_name_tags() and modify_address_tags()
+-- re-register their groups only from the data of the current call, so
+-- confirm the intended behaviour of those callers before changing this.
+local function remove_group_from_main(group)
+    for key, values in pairs(MAIN_KEYS) do
+        for _, ttype in pairs(values) do
+            if ttype == group then
+                values[ttype] = nil
+            end
+        end
+        -- drop keys that have no entries (left)
+        if next(values) == nil then
+            MAIN_KEYS[key] = nil
+        end
+    end
+end
+
+
+-- Add the wildcard patterns from `data` to PRE_FILTER.
+-- `data` maps a group name to a list of key patterns. '*foo' is stored
+-- as suffix pattern and 'foo*' as prefix pattern, both indexed by the
+-- length of the fixed part. Keys without wildcard and a lone '*' are
+-- ignored here.
+local function add_pre_filter(data)
+    -- store `part` for `group` in the given length-indexed pattern table
+    local function register(patterns, part, group)
+        local bucket = patterns[#part]
+        if bucket == nil then
+            bucket = {}
+            patterns[#part] = bucket
+        end
+        bucket[part] = group
+    end
+
+    for group, keys in pairs(data) do
+        for _, key in pairs(keys) do
+            if key:sub(1, 1) == '*' then
+                if #key > 1 then
+                    register(PRE_FILTER.suffix, key:sub(2), group)
+                end
+            elseif key:sub(-1) == '*' then
+                register(PRE_FILTER.prefix, key:sub(1, -2), group)
+            end
+        end
+    end
+end
+
+------------- Place class ------------------------------------------
+
+local Place = {}
+Place.__index = Place
+
+-- Create a Place wrapper around an OSM object.
+--   object:    the OSM object; its `tags` table is read here
+--   geom_func: function kept for creating the geometry later
+-- Tags are sorted with lookup_prefilter_classification(): 'extra' tags
+-- go directly to extratags, 'delete' tags are dropped, the rest is kept
+-- in intags. When none of the kept tags has a classification, intags is
+-- emptied again.
+function Place.new(object, geom_func)
+    local self = setmetatable({}, Place)
+    self.object = object
+    self.geom_func = geom_func
+
+    -- admin_level must be an integer in 1..15, anything else becomes 15
+    local level = tonumber(object.tags.admin_level or 15) or 15
+    if level <= 0 or level > 15 or math.floor(level) ~= level then
+        level = 15
+    end
+    self.admin_level = level
+
+    self.num_entries = 0
+    self.has_name = false
+    self.names = {}
+    self.address = {}
+    self.extratags = {}
+    self.intags = {}
+
+    local classified = false
+    for key, value in pairs(object.tags) do
+        local group = lookup_prefilter_classification(key, value)
+        if group == 'extra' then
+            self.extratags[key] = value
+        elseif group ~= 'delete' then
+            self.intags[key] = value
+            classified = classified or group ~= nil
+        end
+    end
+
+    if not classified then
+        -- no interesting tags, don't bother processing
+        self.intags = {}
+    end
+
+    return self
+end
+
+-- Clean up intags with the matcher functions in `data` (both optional):
+-- tags accepted by data.delete are dropped, tags accepted by data.extra
+-- are moved to extratags. data.delete is consulted first.
+function Place:clean(data)
+    for key, value in pairs(self.intags) do
+        local drop = data.delete ~= nil and data.delete(key, value)
+
+        if drop then
+            self.intags[key] = nil
+        elseif data.extra ~= nil and data.extra(key, value) then
+            self.extratags[key] = value
+            self.intags[key] = nil
+        end
+    end
+end
+
+-- Drop all intags for which the optional matcher data.match returns true.
+function Place:delete(data)
+    local matcher = data.match
+    if matcher == nil then
+        return
+    end
+
+    for key, value in pairs(self.intags) do
+        if matcher(key, value) then
+            self.intags[key] = nil
+        end
+    end
+end
+
+-- Move all intags accepted by the optional matcher data.match over to
+-- extratags. Returns the number of tags moved.
+function Place:grab_extratags(data)
+    local matcher = data.match
+    if matcher == nil then
+        return 0
+    end
+
+    local moved = 0
+    for key, value in pairs(self.intags) do
+        if matcher(key, value) then
+            self.extratags[key] = value
+            self.intags[key] = nil
+            moved = moved + 1
+        end
+    end
+
+    return moved
+end
+
+-- Return the key without a leading 'addr:' or 'is_in:'. Only one prefix
+-- is removed; other keys are returned unchanged.
+local function strip_address_prefix(k)
+    for _, prefix in ipairs({'addr:', 'is_in:'}) do
+        if k:sub(1, #prefix) == prefix then
+            return k:sub(#prefix + 1)
+        end
+    end
+
+    return k
+end
+
+
+-- Move address tags from intags into self.address.
+-- data.groups (optional) maps a tag to an address group or nil:
+--   'main'  - stored without addr:/is_in: prefix, counted, and the
+--             place is marked as named
+--   'extra' - stored without addr:/is_in: prefix
+--   other   - stored under the group name itself
+-- Returns the number of 'main' address tags found.
+function Place:grab_address_parts(data)
+    local classify = data.groups
+    local count = 0
+
+    if classify == nil then
+        return count
+    end
+
+    for key, value in pairs(self.intags) do
+        local atype = classify(key, value)
+
+        if atype ~= nil then
+            local target = atype
+            if atype == 'main' or atype == 'extra' then
+                target = strip_address_prefix(key)
+            end
+            self.address[target] = value
+
+            if atype == 'main' then
+                self.has_name = true
+                count = count + 1
+            end
+
+            self.intags[key] = nil
+        end
+    end
+
+    return count
+end
+
+
+-- Move name tags from intags into self.names.
+-- data.groups (optional) maps a tag to a name group or nil. Groups
+-- 'main' and 'house' mark the place as named. A 'house' name
+-- additionally yields a place=house fallback.
+-- Returns the fallback as a {class, type, transform} triple or nil.
+function Place:grab_name_parts(data)
+    local classify = data.groups
+    if classify == nil then
+        return nil
+    end
+
+    local fallback = nil
+    for key, value in pairs(self.intags) do
+        local atype = classify(key, value)
+
+        if atype ~= nil then
+            self.names[key] = value
+            self.intags[key] = nil
+
+            if atype == 'house' then
+                fallback = {'place', 'house', address_fallback}
+            end
+            if atype == 'main' or atype == 'house' then
+                self.has_name = true
+            end
+        end
+    end
+
+    return fallback
+end
+
+
+-- Write a row for tag k=v if the transform function allows it.
+--   v:     value to use; when nil, the value of intags[k] is used
+--   mfunc: transform, called as mfunc(self, k, v); returns the place to
+--          write or a false value to skip the row
+-- Returns the number of rows written and adds it to self.num_entries.
+function Place:write_place(k, v, mfunc)
+    v = v or self.intags[k]
+
+    local place = v ~= nil and mfunc(self, k, v)
+    if not place then
+        return 0
+    end
+
+    local written = place:write_row(k, v)
+    self.num_entries = self.num_entries + written
+    return written
+end
+
+-- Insert a row with class k and type v for this place.
+-- The geometry is created with geom_func on first use and then kept.
+-- Returns 1 when a row was inserted and 0 when there is no geometry or
+-- the geometry is null.
+function Place:write_row(k, v)
+    local geom = self.geometry
+    if geom == nil then
+        geom = self.geom_func(self.object)
+        self.geometry = geom
+    end
+    if geom == nil or geom:is_null() then
+        return 0
+    end
+
+    -- a missing or empty extratags table is handed on as nil
+    local extratags = EXTRATAGS_FILTER(self, k, v)
+    local has_extratags = extratags and next(extratags)
+
+    insert_row{
+        class = k,
+        type = v,
+        admin_level = self.admin_level,
+        name = next(self.names) and self.names,
+        address = next(self.address) and self.address,
+        extratags = has_extratags and extratags or nil,
+        geometry = self.geometry
+    }
+
+    return 1
+end
+
+
+-- Create a copy of this place where individual fields may be replaced.
+-- `data` may provide geometry, intags, admin_level, names, address and
+-- extratags; fields not given are shared with the original (tables are
+-- not copied). num_entries and has_name are not carried over.
+function Place:clone(data)
+    local cp = setmetatable({
+        object = self.object,
+        geom_func = self.geom_func
+    }, Place)
+
+    for _, field in ipairs({'geometry', 'intags', 'admin_level',
+                            'names', 'address', 'extratags'}) do
+        cp[field] = data[field] or self[field]
+    end
+
+    return cp
+end
+
+
+-- Build a matcher function for tags.
+--   data.keys: list of keys to match; '*foo' matches keys ending in
+--              'foo', 'foo*' keys starting with 'foo', everything else
+--              must match exactly
+--   data.tags: table of key -> list of values that match for that key;
+--              ignored for keys that are listed as exact key in data.keys
+-- Returns a function (k, v) -> boolean, or nil when data is nil or empty.
+function module.tag_match(data)
+    if data == nil or next(data) == nil then
+        return nil
+    end
+
+    local fullmatches = {}
+    local key_prefixes = {}
+    local key_suffixes = {}
+
+    -- remember `part` in the length-indexed pattern table
+    local function remember(patterns, part)
+        local len = #part
+        if patterns[len] == nil then
+            patterns[len] = {}
+        end
+        patterns[len][part] = true
+    end
+
+    if data.keys ~= nil then
+        for _, key in pairs(data.keys) do
+            if key:sub(1, 1) == '*' then
+                if #key > 1 then
+                    remember(key_suffixes, key:sub(2))
+                end
+            elseif key:sub(-1) == '*' then
+                remember(key_prefixes, key:sub(1, -2))
+            else
+                fullmatches[key] = true
+            end
+        end
+    end
+
+    if data.tags ~= nil then
+        for key, values in pairs(data.tags) do
+            if fullmatches[key] == nil then
+                local accepted = {}
+                for _, value in pairs(values) do
+                    accepted[value] = true
+                end
+                fullmatches[key] = accepted
+            end
+        end
+    end
+
+    return function (k, v)
+        local exact = fullmatches[k]
+        if exact == true or (exact ~= nil and exact[v] ~= nil) then
+            return true
+        end
+
+        local klen = #k
+
+        for len, parts in pairs(key_suffixes) do
+            if klen >= len and parts[k:sub(-len)] ~= nil then
+                return true
+            end
+        end
+
+        for len, parts in pairs(key_prefixes) do
+            if klen >= len and parts[k:sub(1, len)] ~= nil then
+                return true
+            end
+        end
+
+        return false
+    end
+end
+
+
+-- Build a classifier function for keys.
+-- `data` maps a group name to a list of key patterns ('*foo' matches keys
+-- ending in 'foo', 'foo*' keys starting with 'foo', everything else must
+-- match exactly).
+-- Returns a function (k) that yields the group for key k or nil when no
+-- pattern applies. Exact matches are tried first, then suffixes, then
+-- prefixes. Returns nil instead of a function when data is nil or empty.
+function module.tag_group(data)
+    if data == nil or next(data) == nil then
+        return nil
+    end
+
+    local fullmatches = {}
+    local key_prefixes = {}
+    local key_suffixes = {}
+
+    -- assign `group` to `part` in the length-indexed pattern table
+    local function remember(patterns, part, group)
+        local len = #part
+        if patterns[len] == nil then
+            patterns[len] = {}
+        end
+        patterns[len][part] = group
+    end
+
+    for group, tags in pairs(data) do
+        for _, key in pairs(tags) do
+            if key:sub(1, 1) == '*' then
+                if #key > 1 then
+                    remember(key_suffixes, key:sub(2), group)
+                end
+            elseif key:sub(-1) == '*' then
+                remember(key_prefixes, key:sub(1, -2), group)
+            else
+                fullmatches[key] = group
+            end
+        end
+    end
+
+    return function (k)
+        local found = fullmatches[k]
+        if found ~= nil then
+            return found
+        end
+
+        local klen = #k
+
+        for len, parts in pairs(key_suffixes) do
+            if klen >= len then
+                found = parts[k:sub(-len)]
+                if found ~= nil then
+                    return found
+                end
+            end
+        end
+
+        for len, parts in pairs(key_prefixes) do
+            if klen >= len then
+                found = parts[k:sub(1, len)]
+                if found ~= nil then
+                    return found
+                end
+            end
+        end
+    end
+end
+
+-- Returns prefix part of the keys, and reject suffix matching keys
+-- Reduce a key pattern to its fixed leading part.
+-- Suffix patterns ('*foo') are rejected with nil. For prefix patterns
+-- the trailing '*' and the character in front of it are cut off
+-- (e.g. 'name:*' becomes 'name'). Plain keys are returned unchanged.
+local function process_key(key)
+    local first, last = key:sub(1, 1), key:sub(-1)
+
+    if first == '*' then
+        return nil
+    elseif last == '*' then
+        return key:sub(1, -3)
+    end
+
+    return key
+end
+
+-- Process functions for all data types
+-- Process an OSM node. The geometry of the place is the point of the node.
+function module.process_node(object)
+    module.process_tags(Place.new(object, function (o)
+        return o:as_point()
+    end))
+end
+
+-- Process an OSM way. The geometry is the polygon of the way when it is
+-- not null. Otherwise the linestring is used, unless it is null or its
+-- length() exceeds 30, in which case the place has no geometry.
+function module.process_way(object)
+    local function geom_func(o)
+        local polygon = o:as_polygon()
+        if not polygon:is_null() then
+            return polygon
+        end
+
+        local line = o:as_linestring()
+        if line:is_null() or line:length() > 30 then
+            return nil
+        end
+        return line
+    end
+
+    module.process_tags(Place.new(object, geom_func))
+end
+
+-- Process an OSM relation. Only relations whose 'type' tag has a
+-- geometry function registered in module.RELATION_TYPES are handled.
+function module.process_relation(object)
+    local geom_func = module.RELATION_TYPES[object.tags.type]
+    if geom_func == nil then
+        return
+    end
+
+    module.process_tags(Place.new(object, geom_func))
+end
+
+-- The process functions are used by default by osm2pgsql.
+-- When the global `themepark` is set, they are registered there with
+-- add_proc(); otherwise they are installed directly as the osm2pgsql
+-- callbacks for nodes, ways and relations.
+if themepark then
+    themepark:add_proc('node', module.process_node)
+    themepark:add_proc('way', module.process_way)
+    themepark:add_proc('relation', module.process_relation)
+else
+    osm2pgsql.process_node = module.process_node
+    osm2pgsql.process_way = module.process_way
+    osm2pgsql.process_relation = module.process_relation
+end
+
+-- Main processing of a Place `o`: sorts the remaining intags into names
+-- and address parts, writes one row for each main tag whose transform
+-- accepts the place and, when no row was written at all, a single
+-- fallback row if one was found.
+function module.process_tags(o)
+    if next(o.intags) == nil then
+        return  -- shortcut when pre-filtering has removed all tags
+    end
+
+    -- Exception for boundary/place double tagging
+    -- (the place tag is moved to extratags unless its value starts
+    -- with 'isl')
+    if o.intags.boundary == 'administrative' then
+        o:grab_extratags{match = function (k, v)
+            return k == 'place' and v:sub(1,3) ~= 'isl'
+        end}
+    end
+
+    -- name keys
+    local fallback = o:grab_name_parts{groups=NAME_FILTER}
+
+    -- address keys
+    if o:grab_address_parts{groups=ADDRESS_FILTER} > 0 and fallback == nil then
+        fallback = {'place', 'house', address_fallback}
+    end
+    -- only keep country values that are exactly two characters long
+    if o.address.country ~= nil and #o.address.country ~= 2 then
+        o.address['country'] = nil
+    end
+    if POSTCODE_FALLBACK and fallback == nil and o.address.postcode ~= nil then
+        fallback = {'place', 'postcode', PlaceTransform.always}
+    end
+
+    -- objects with an interpolation address are written as place=houses
+    -- only; main tags and fallbacks are not looked at
+    if o.address.interpolation ~= nil then
+        o:write_place('place', 'houses', PlaceTransform.always)
+        return
+    end
+
+    -- collect main keys
+    for k, v in pairs(o.intags) do
+        local ktable = MAIN_KEYS[k]
+        if ktable then
+            -- entry for the value takes precedence over the key default
+            local ktype = ktable[v] or ktable[1]
+            if type(ktype) == 'function' then
+                o:write_place(k, v, ktype)
+            elseif ktype == 'fallback' and o.has_name then
+                fallback = {k, v, PlaceTransform.named}
+            end
+        end
+    end
+
+    -- the fallback is only used when nothing else was written
+    if fallback ~= nil and o.num_entries == 0 then
+        o:write_place(fallback[1], fallback[2], fallback[3])
+    end
+end
+
+--------- Convenience functions for simple style configuration -----------------
+
+-- Set the pre-filters for the 'delete' and 'extra' groups.
+-- `data` may contain delete_keys, delete_tags, extra_keys and extra_tags.
+-- Plain keys and tags are registered in MAIN_KEYS; PRE_FILTER is reset
+-- and refilled with the wildcard patterns from the key lists.
+function module.set_prefilters(data)
+    for _, group in ipairs({'delete', 'extra'}) do
+        remove_group_from_main(group)
+        merge_filters_into_main(group,
+                                data[group .. '_keys'],
+                                data[group .. '_tags'])
+    end
+
+    PRE_FILTER = {prefix = {}, suffix = {}}
+    add_pre_filter{delete = data.delete_keys, extra = data.extra_keys}
+end
+
+
+-- Add keys to the 'delete' pre-filter group.
+-- `data` is either a list of key patterns or the name of a preset in
+-- PRESETS.IGNORE_KEYS. Raises an error for an unknown preset name.
+function module.ignore_keys(data)
+    if type(data) == 'string' then
+        local keys = PRESETS.IGNORE_KEYS[data]
+        if keys == nil then
+            error('Unknown preset for ignored keys: ' .. data)
+        end
+        data = keys
+    end
+
+    merge_filters_into_main('delete', data)
+    add_pre_filter{delete = data}
+end
+
+
+-- Add keys to the 'extra' pre-filter group.
+-- `data` is either a list of key patterns or the name of a preset, which
+-- is looked up in PRESETS.EXTRATAGS first and in PRESETS.IGNORE_KEYS
+-- second. Raises an error for an unknown preset name.
+function module.add_for_extratags(data)
+    if type(data) == 'string' then
+        local keys = PRESETS.EXTRATAGS[data] or PRESETS.IGNORE_KEYS[data]
+        if keys == nil then
+            error('Unknown preset for extratags: ' .. data)
+        end
+        data = keys
+    end
+
+    merge_filters_into_main('extra', data)
+    add_pre_filter{extra = data}
+end
+
+
+-- Replace all main tags with the ones given in `data`.
+-- First removes every existing main-tag entry (transform functions and
+-- 'fallback' markers) from MAIN_KEYS, leaving entries of other groups
+-- untouched, then applies `data` with modify_main_tags().
+function module.set_main_tags(data)
+    for key, values in pairs(MAIN_KEYS) do
+        -- Clear by key: an entry is stored under the tag value (or under
+        -- slot 1 for the default of the key), not under the transform.
+        -- Setting existing fields to nil is allowed during traversal.
+        for tagvalue, ttype in pairs(values) do
+            if ttype == 'fallback' or type(ttype) == 'function' then
+                values[tagvalue] = nil
+            end
+        end
+        if next(values) == nil then
+            MAIN_KEYS[key] = nil
+        end
+    end
+    module.modify_main_tags(data)
+end
+
+
+-- Add or change main tags.
+-- `data` is a preset name or a table. Preset names starting with
+-- 'street/' are looked up in PRESETS.MAIN_TAGS_STREETS, names starting
+-- with 'poi/' are created with PRESETS.MAIN_TAGS_POIS() and all others
+-- are taken from PRESETS.MAIN_TAGS. An unknown preset raises an error.
+-- In a table each key maps to a transform (used as default for the key)
+-- or to a table of value -> transform. A transform is either a function
+-- or a string naming an entry of PlaceTransform.
+function module.modify_main_tags(data)
+    if type(data) == 'string' then
+        local preset = data
+        if preset:sub(1, 7) == 'street/' then
+            data = PRESETS.MAIN_TAGS_STREETS[preset:sub(8)]
+        elseif preset:sub(1, 4) == 'poi/' then
+            data = PRESETS.MAIN_TAGS_POIS(preset:sub(5))
+        else
+            data = PRESETS.MAIN_TAGS[preset]
+        end
+        if data == nil then
+            error('Unknown preset for main tags: ' .. preset)
+        end
+    end
+
+    -- functions are used as is, anything else is looked up in PlaceTransform
+    local function resolve(transform)
+        if type(transform) == 'function' then
+            return transform
+        end
+        return PlaceTransform[transform]
+    end
+
+    for key, spec in pairs(data) do
+        local entry = MAIN_KEYS[key]
+        if entry == nil then
+            entry = {}
+            MAIN_KEYS[key] = entry
+        end
+
+        local kind = type(spec)
+        if kind == 'table' then
+            for value, transform in pairs(spec) do
+                entry[value] = resolve(transform)
+            end
+        elseif kind == 'function' or kind == 'string' then
+            entry[1] = resolve(spec)
+        end
+    end
+end
+
+
+-- Change the name tag configuration.
+-- `data` is a preset name from PRESETS.NAME_TAGS or a table mapping a
+-- name group to a list of key patterns. A non-empty list replaces the
+-- keys of its group, an empty list removes the group. Afterwards
+-- NAME_FILTER is rebuilt and the keys of data.house, when given, are
+-- registered in MAIN_KEYS under 'fallback:name'.
+-- Raises an error for an unknown preset name.
+function module.modify_name_tags(data)
+    if type(data) == 'string' then
+        local preset = PRESETS.NAME_TAGS[data]
+        if preset == nil then
+            error('Unknown preset for name keys: ' .. data)
+        end
+        data = preset
+    end
+
+    for group, keys in pairs(data) do
+        NAMES[group] = next(keys) and keys or nil
+    end
+    NAME_FILTER = module.tag_group(NAMES)
+
+    remove_group_from_main('fallback:name')
+    if data.house ~= nil then
+        merge_filters_into_main('fallback:name', data.house)
+    end
+end
+
+
+-- Replace the name tag configuration: empties NAMES and then applies
+-- `data` (preset name or table) with modify_name_tags().
+function module.set_name_tags(data)
+    NAMES = {}
+    module.modify_name_tags(data)
+end
+
+
+-- Replace the address tag configuration: empties ADDRESS_TAGS and then
+-- applies `data` with modify_address_tags().
+-- NOTE(review): module.set_address_tags is assigned a second time further
+-- down in this file; the later definition is the one that takes effect.
+function module.set_address_tags(data)
+    ADDRESS_TAGS = {}
+    module.modify_address_tags(data)
+end
+
+
+-- Change the address tag configuration.
+-- `data` is a preset name from PRESETS.ADDRESS_TAGS or a table mapping
+-- an address group to a list of key patterns. The special entry
+-- 'postcode_fallback' is not a group, its value is stored in
+-- POSTCODE_FALLBACK. An empty list removes a group, a non-empty list
+-- replaces it. Raises an error for an unknown preset name.
+function module.modify_address_tags(data)
+    if type(data) == 'string' then
+        local preset = data
+        data = PRESETS.ADDRESS_TAGS[data]
+        if data == nil then
+            error('Unknown preset for address keys: ' .. preset)
+        end
+    end
+
+    for k, v in pairs(data) do
+        if k == 'postcode_fallback' then
+            POSTCODE_FALLBACK = v
+        elseif next(v) == nil then
+            ADDRESS_TAGS[k] = nil
+        else
+            ADDRESS_TAGS[k] = v
+        end
+    end
+
+    -- rebuild the classifier used by process_tags()
+    ADDRESS_FILTER = module.tag_group(ADDRESS_TAGS)
+
+    -- register the keys of this call in MAIN_KEYS; note that only the
+    -- groups from `data` are used here, not the merged ADDRESS_TAGS
+    remove_group_from_main('fallback:address')
+    merge_filters_into_main('fallback:address', data.main)
+    merge_filters_into_main('fallback:address', data.interpolation)
+    remove_group_from_main('fallback:postcode')
+    if POSTCODE_FALLBACK then
+        merge_filters_into_main('fallback:postcode', data.postcode)
+    end
+end
+
+
+-- Replace the address tag configuration with `data` (a preset name or a
+-- table as accepted by modify_address_tags()).
+-- This definition overrides the one of the same name further up.
+function module.set_address_tags(data)
+    -- Reset the table that modify_address_tags() fills and that
+    -- ADDRESS_FILTER is built from, so that old groups do not survive.
+    ADDRESS_TAGS = {}
+    module.modify_address_tags(data)
+end
+
+
+-- Switch the postcode fallback on or off.
+-- When the setting changes, the 'fallback:postcode' group is removed from
+-- MAIN_KEYS and, if enabled, registered again for the keys in
+-- ADDRESS_TAGS.postcode.
+function module.set_postcode_fallback(enable)
+    local changed = POSTCODE_FALLBACK ~= enable
+    POSTCODE_FALLBACK = enable
+
+    if not changed then
+        return
+    end
+
+    remove_group_from_main('fallback:postcode')
+    if enable then
+        merge_filters_into_main('fallback:postcode', ADDRESS_TAGS.postcode)
+    end
+end
+
+
+-- Define what happens with tags that are left over in intags when a row
+-- is written, by replacing EXTRATAGS_FILTER.
+--   function: used directly as the new filter
+--   nil:      restores default_extratags_filter
+--   table with delete_keys/delete_tags only: all leftover tags except the
+--             matching ones are added to the extratags
+--   table with extra_keys/extra_tags only: only the matching leftover
+--             tags are added to the extratags
+-- Mixing delete_* and extra_* settings raises an error.
+-- The tag that is written as class/type of the row is never added.
+function module.set_unused_handling(data)
+    if type(data) == 'function' then
+        EXTRATAGS_FILTER = data
+    elseif data == nil then
+        EXTRATAGS_FILTER = default_extratags_filter
+    elseif data.extra_keys == nil and data.extra_tags == nil then
+        -- NOTE(review): tag_match() returns nil when neither delete_keys
+        -- nor delete_tags is set (e.g. for an empty table); delfilter
+        -- would then be called as nil below - confirm this cannot happen.
+        local delfilter = module.tag_match{keys = data.delete_keys, tags = data.delete_tags}
+        EXTRATAGS_FILTER = function (p, k)
+            local extra = {}
+            for kin, vin in pairs(p.intags) do
+                if kin ~= k and not delfilter(kin, vin) then
+                    extra[kin] = vin
+                end
+            end
+            -- nothing to add: hand out the extratags table itself
+            if next(extra) == nil then
+                return p.extratags
+            end
+            -- entries of p.extratags win over leftover tags of the same key
+            for kextra, vextra in pairs(p.extratags) do
+                extra[kextra] = vextra
+            end
+            return extra
+        end
+    elseif data.delete_keys == nil and data.delete_tags == nil then
+        local incfilter = module.tag_match{keys = data.extra_keys, tags = data.extra_tags}
+        EXTRATAGS_FILTER = function (p, k)
+            local extra = {}
+            for kin, vin in pairs(p.intags) do
+                if kin ~= k and incfilter(kin, vin) then
+                    extra[kin] = vin
+                end
+            end
+            -- nothing to add: hand out the extratags table itself
+            if next(extra) == nil then
+                return p.extratags
+            end
+            -- entries of p.extratags win over leftover tags of the same key
+            for kextra, vextra in pairs(p.extratags) do
+                extra[kextra] = vextra
+            end
+            return extra
+        end
+    else
+        error("unused handler can have only 'extra_keys' or 'delete_keys' set.")
+    end
+end
+
+-- Define which relation types are processed and how their geometry is
+-- built. `data` maps the value of the relation's 'type' tag to either
+-- 'multipolygon' or 'multiline'. Entries with any other value are
+-- ignored. All previously configured relation types are discarded.
+function module.set_relation_types(data)
+    module.RELATION_TYPES = {}
+    -- pairs() is required: a plain table cannot be used as iterator
+    for k, v in pairs(data) do
+        if v == 'multipolygon' then
+            module.RELATION_TYPES[k] = module.relation_as_multipolygon
+        elseif v == 'multiline' then
+            module.RELATION_TYPES[k] = module.relation_as_multiline
+        end
+    end
+end
+
+
+-- Return the current tag configuration as a table with the fields
+-- main (MAIN_KEYS), name (NAMES) and address (ADDRESS_TAGS). The tables
+-- are handed out directly, not as copies.
+function module.get_taginfo()
+    return {main = MAIN_KEYS, name = NAMES, address = ADDRESS_TAGS}
+end
+
+return module
diff --git a/lib-lua/themes/nominatim/presets.lua b/lib-lua/themes/nominatim/presets.lua
new file mode 100644
index 00000000..00ff0f52
--- /dev/null
+++ b/lib-lua/themes/nominatim/presets.lua
@@ -0,0 +1,382 @@
+-- Defines defaults used in the topic definitions.
+
+local module = {}
+
+-- Helper functions
+
+-- Merge the lists of group2 into group1 and return group1.
+-- Groups that only exist in group2 are taken over by reference (the list
+-- is then shared by both tables). For groups present in both, the values
+-- of group2 are appended to the list in group1.
+local function group_merge(group1, group2)
+    for name, values in pairs(group2) do
+        local target = group1[name]
+        if target ~= nil then
+            for _, v in pairs(values) do
+                target[#target + 1] = v
+            end
+        else
+            group1[name] = values
+        end
+    end
+
+    return group1
+end
+
+-- Customized main tag filter functions
+
+-- Values of the 'footway' tag that exclude a footway from import.
+-- Every entry needs an explicit value: a bare name in the constructor
+-- would be read as a (nil) variable and not create a key.
+local EXCLUDED_FOOTWAYS = { sidewalk = 1, crossing = 1, link = 1, traffic_aisle = 1 }
+
+-- Transform for footways: accepts only named places and rejects those
+-- whose 'footway' tag has one of the values in EXCLUDED_FOOTWAYS.
+-- Returns the place when accepted and false otherwise.
+local function filter_footways(place)
+    if place.has_name then
+        local footway = place.object.tags.footway
+        if footway == nil or EXCLUDED_FOOTWAYS[footway] ~= 1 then
+            return place
+        end
+    end
+    return false
+end
+
+-- Create a transform that accepts a place only when its intags contain
+-- key=value. With `named` set, the place must have a name as well.
+-- The transform returns the place when accepted and false otherwise.
+local function include_when_tag_present(key, value, named)
+    return function(place)
+        if (not named or place.has_name) and place.intags[key] == value then
+            return place
+        end
+        return false
+    end
+end
+
+-- Create a transform that accepts a place only when its intags do not
+-- contain `key`. With `named` set, the place must have a name as well.
+-- The transform returns the place when accepted and false otherwise.
+local function exclude_when_key_present(key, named)
+    return function(place)
+        if (not named or place.has_name) and place.intags[key] == nil then
+            return place
+        end
+        return false
+    end
+end
+
+-- Transform for locks: accepts only objects that have a 'waterway' tag
+-- and a 'lock_name' tag. The result is a clone of the place whose names
+-- consist of the lock_name (as 'name') and the lock_ref (as 'ref').
+-- Returns false for all other objects.
+local function lock_transform(place)
+    local tags = place.object.tags
+    local name = tags.lock_name
+
+    if tags.waterway == nil or name == nil then
+        return false
+    end
+
+    return place:clone{names={name=name, ref=tags.lock_ref}}
+end
+
+-- Main tag definition
+
+-- Named presets for main tags. Each preset maps an OSM key either to a
+-- single transform or to a table of tag value -> transform; an entry
+-- without explicit key in such a table is the default for the key.
+-- Transforms are given as functions or as strings.
+module.MAIN_TAGS = {}
+
+-- Preset 'admin': administrative boundaries, selected landuse values
+-- and the listed place types.
+module.MAIN_TAGS.admin = {
+    boundary = {administrative = 'named'},
+    landuse = {residential = 'fallback',
+               farm = 'fallback',
+               farmyard = 'fallback',
+               industrial = 'fallback',
+               commercial = 'fallback',
+               allotments = 'fallback',
+               retail = 'fallback'},
+    place = {county = 'always',
+             district = 'always',
+             municipality = 'always',
+             city = 'always',
+             town = 'always',
+             borough = 'always',
+             village = 'always',
+             suburb = 'always',
+             hamlet = 'always',
+             croft = 'always',
+             subdivision = 'always',
+             allotments = 'always',
+             neighbourhood = 'always',
+             quarter = 'always',
+             isolated_dwelling = 'always',
+             farm = 'always',
+             city_block = 'always',
+             locality = 'always'}
+}
+
+-- Preset 'all_boundaries': every boundary type by default (with special
+-- handling for the values place, land_area and postal_code), plus all
+-- landuse and place values.
+module.MAIN_TAGS.all_boundaries = {
+    boundary = {'named',
+                place = 'delete',
+                land_area = 'delete',
+                postal_code = 'always'},
+    landuse = 'fallback',
+    place = 'always'
+}
+
+-- Preset 'natural': waterways, natural features, mountain passes and
+-- water bodies. natural=water and the 'water' key are linked: the
+-- natural=water row is only used when no 'water' tag is present, the
+-- default for 'water' only when natural=water is present; both require
+-- a name.
+module.MAIN_TAGS.natural = {
+    waterway = {'named',
+                riverbank = 'delete'},
+    natural = {'named',
+               yes = 'delete',
+               no = 'delete',
+               coastline = 'delete',
+               saddle = 'fallback',
+               water = exclude_when_key_present('water', true)},
+    mountain_pass = {'always',
+                     no = 'delete'},
+    water = {include_when_tag_present('natural', 'water', true),
+             river = 'never',
+             stream = 'never',
+             canal = 'never',
+             ditch = 'never',
+             drain = 'never',
+             fish_pass = 'never',
+             yes = 'delete',
+             intermittent = 'delete',
+             tidal = 'delete'
+             }
+}
+
+-- Create the main tag preset for points of interest.
+--   group: transform name assigned to the tag values that should not
+--          create a place of their own (e.g. amenity=no); defaults to
+--          'delete' when nil
+-- Returns a new table on every call.
+module.MAIN_TAGS_POIS = function (group)
+    group = group or 'delete'
+    return {
+    aerialway = {'always',
+                 no = group,
+                 pylon = group},
+    aeroway = {'always',
+               no = group},
+    amenity = {'always',
+               no = group,
+               parking_space = group,
+               parking_entrance = group,
+               waste_disposal = group,
+               hunting_stand = group},
+    building = {'fallback',
+                no = group},
+    bridge = {'named_with_key',
+              no = group},
+    club = {'always',
+            no = group},
+    craft = {'always',
+             no = group},
+    emergency = {'always',
+                 no = group,
+                 yes = group,
+                 fire_hydrant = group},
+    healthcare = {'fallback',
+                  yes = group,
+                  no = group},
+    highway = {'always',
+               no = group,
+               turning_circle = group,
+               mini_roundabout = group,
+               noexit = group,
+               crossing = group,
+               give_way = group,
+               stop = group,
+               turning_loop = group,
+               passing_place = group,
+               street_lamp = 'named',
+               traffic_signals = 'named'},
+    historic = {'fallback',
+                yes = group,
+                no = group},
+    -- 'information' is only used together with tourism=information
+    information = {include_when_tag_present('tourism', 'information'),
+                   yes = 'delete',
+                   route_marker = 'never',
+                   trail_blaze = 'never'},
+    junction = {'fallback',
+                no = group},
+    landuse = {cemetery = 'always'},
+    leisure = {'always',
+               nature_reserve = 'fallback',
+               swimming_pool = 'named',
+               no = group},
+    lock = {yes = lock_transform},
+    man_made = {pier = 'always',
+                tower = 'always',
+                bridge = 'always',
+                works = 'named',
+                water_tower = 'always',
+                dyke = 'named',
+                adit = 'named',
+                lighthouse = 'always',
+                watermill = 'always',
+                tunnel = 'always'},
+    military = {'always',
+                yes = group,
+                no = group},
+    office = {'always',
+              no = group},
+    railway = {'named',
+               rail = group,
+               no = group,
+               abandoned = group,
+               disused = group,
+               razed = group,
+               level_crossing = group,
+               switch = group,
+               signal = group,
+               buffer_stop = group},
+    shop = {'always',
+            no = group},
+    -- tourism=information is only used when there is no 'information' tag
+    tourism = {'always',
+               attraction = 'fallback',
+               no = group,
+               yes = group,
+               information = exclude_when_key_present('information')},
+    tunnel = {'named_with_key',
+              no = group}
+} end
+
+-- Named presets for street main tags.
+module.MAIN_TAGS_STREETS = {}
+
+-- Preset 'default': the listed road classes use 'always'; service roads,
+-- paths, tracks and link roads use 'named'; footways go through
+-- filter_footways.
+module.MAIN_TAGS_STREETS.default = {
+    place = {square = 'always'},
+    highway = {motorway = 'always',
+               trunk = 'always',
+               primary = 'always',
+               secondary = 'always',
+               tertiary = 'always',
+               unclassified = 'always',
+               residential = 'always',
+               road = 'always',
+               living_street = 'always',
+               pedestrian = 'always',
+               service = 'named',
+               cycleway = 'named',
+               path = 'named',
+               footway = filter_footways,
+               steps = 'named',
+               bridleway = 'named',
+               track = 'named',
+               motorway_link = 'named',
+               trunk_link = 'named',
+               primary_link = 'named',
+               secondary_link = 'named',
+               tertiary_link = 'named'}
+}
+
+-- Preset 'car': all listed highway types use 'always'. Compared to the
+-- 'default' preset there are no entries for pedestrian, cycleway, path,
+-- footway, steps and bridleway.
+module.MAIN_TAGS_STREETS.car = {
+    place = {square = 'always'},
+    highway = {motorway = 'always',
+               trunk = 'always',
+               primary = 'always',
+               secondary = 'always',
+               tertiary = 'always',
+               unclassified = 'always',
+               residential = 'always',
+               road = 'always',
+               living_street = 'always',
+               service = 'always',
+               track = 'always',
+               motorway_link = 'always',
+               trunk_link = 'always',
+               primary_link = 'always',
+               secondary_link = 'always',
+               tertiary_link = 'always'}
+}
+
+-- Preset 'all': the same highway types as in the 'default' preset, but
+-- every one of them uses 'always'.
+module.MAIN_TAGS_STREETS.all = {
+    place = {square = 'always'},
+    highway = {motorway = 'always',
+               trunk = 'always',
+               primary = 'always',
+               secondary = 'always',
+               tertiary = 'always',
+               unclassified = 'always',
+               residential = 'always',
+               road = 'always',
+               living_street = 'always',
+               pedestrian = 'always',
+               service = 'always',
+               cycleway = 'always',
+               path = 'always',
+               footway = 'always',
+               steps = 'always',
+               bridleway = 'always',
+               track = 'always',
+               motorway_link = 'always',
+               trunk_link = 'always',
+               primary_link = 'always',
+               secondary_link = 'always',
+               tertiary_link = 'always'}
+}
+
+
+-- name tags
+
+-- Named presets for name tags. Each preset maps a name group ('main',
+-- 'extra', 'house') to a list of key patterns; a leading or trailing
+-- '*' is a wildcard.
+module.NAME_TAGS = {}
+
+-- Preset 'core': the usual name variants and reference tags.
+module.NAME_TAGS.core = {main = {'name', 'name:*',
+                                 'int_name', 'int_name:*',
+                                 'nat_name', 'nat_name:*',
+                                 'reg_name', 'reg_name:*',
+                                 'loc_name', 'loc_name:*',
+                                 'old_name', 'old_name:*',
+                                 'alt_name', 'alt_name:*', 'alt_name_*',
+                                 'official_name', 'official_name:*',
+                                 'place_name', 'place_name:*',
+                                 'short_name', 'short_name:*'},
+                         extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
+                                  'loc_ref', 'old_ref', 'ISO3166-2'}
+                        }
+-- Preset 'address': house names.
+module.NAME_TAGS.address = {house = {'addr:housename'}}
+-- Preset 'poi': brand and airport codes, followed by all keys of 'core'.
+module.NAME_TAGS.poi = group_merge({main = {'brand'},
+                                    extra = {'iata', 'icao'}},
+                                   module.NAME_TAGS.core)
+
+-- Address tagging
+
+-- Named presets for address tags. Each preset maps an address group to
+-- a list of key patterns; a trailing '*' is a wildcard.
+module.ADDRESS_TAGS = {}
+
+-- Preset 'core': general address parts, postcodes and country codes.
+module.ADDRESS_TAGS.core = { extra = {'addr:*', 'is_in:*', 'tiger:county'},
+                             postcode = {'postal_code', 'postcode', 'addr:postcode',
+                                         'tiger:zip_left', 'tiger:zip_right'},
+                             country = {'country_code', 'ISO3166-1',
+                                        'addr:country_code', 'is_in:country_code',
+                                        'addr:country', 'is_in:country'}
+                           }
+
+-- Preset 'houses': house numbers and address interpolations.
+module.ADDRESS_TAGS.houses = { main = {'addr:housenumber',
+                                       'addr:conscriptionnumber',
+                                       'addr:streetnumber'},
+                               interpolation = {'addr:interpolation'}
+                             }
+
+-- Ignored tags (prefiltered away)
+
+-- Named presets with lists of key patterns to ignore. A leading or
+-- trailing '*' is a wildcard.
+module.IGNORE_KEYS = {}
+
+-- Preset 'metatags': notes, sources and import-specific tags.
+module.IGNORE_KEYS.metatags = {'note', 'note:*', 'source', 'source:*', '*source',
+                               'attribution', 'comment', 'fixme', 'created_by',
+                               'tiger:cfcc', 'tiger:reviewed', 'nysgissam:*',
+                               'NHD:*', 'nhd:*', 'gnis:*', 'geobase:*', 'yh:*',
+                               'osak:*', 'naptan:*', 'CLC:*', 'import', 'it:fvg:*',
+                               'lacounty:*', 'ref:linz:*',
+                               'ref:bygningsnr', 'ref:ruian:*', 'building:ruian:type',
+                               'type',
+                               'is_in:postcode'}
+-- Preset 'name': name-related keys that are not names themselves.
+module.IGNORE_KEYS.name = {'*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
+                           'name:etymology', 'name:etymology:*',
+                           'name:signed', 'name:botanical'}
+-- Preset 'address': sub-keys of address tags.
+module.IGNORE_KEYS.address = {'addr:street:*', 'addr:city:*', 'addr:district:*',
+                              'addr:province:*', 'addr:subdistrict:*', 'addr:place:*',
+                              'addr:TW:dataset'}
+
+-- Extra tags (prefiltered away)
+
+-- Named presets with lists of key patterns for extratags.
+module.EXTRATAGS = {}
+
+-- Preset 'required': wikipedia/wikidata links and the capital tag.
+module.EXTRATAGS.required = {'wikipedia', 'wikipedia:*', 'wikidata', 'capital'}
+
+return module
diff --git a/lib-lua/themes/nominatim/topics/address.lua b/lib-lua/themes/nominatim/topics/address.lua
new file mode 100644
index 00000000..0e813673
--- /dev/null
+++ b/lib-lua/themes/nominatim/topics/address.lua
@@ -0,0 +1,23 @@
+local _, flex, cfg = ...  -- chunk arguments; only the 2nd (flex) and 3rd (cfg) are used
+-- Main tags: 'admin', then the street theme (cfg.street_theme, else 'default') and a postal_code rule.
+flex.set_main_tags('admin')
+flex.modify_main_tags('street/' .. (cfg.street_theme or 'default'))
+flex.modify_main_tags{boundary = {postal_code = 'always'}}
+-- Name tags: 'core', then 'address'.
+flex.set_name_tags('core')
+flex.modify_name_tags('address')  -- NOTE(review): presumably amends the set installed above; confirm
+-- Address tags: 'core', then 'houses'.
+flex.set_address_tags('core')
+flex.modify_address_tags('houses')
+-- Unconditional part: ignore the 'metatags' keys, pass 'required' to add_for_extratags.
+flex.ignore_keys('metatags')
+flex.add_for_extratags('required')
+-- cfg.with_extratags decides whether the 'name'/'address' key groups go to extratags or are ignored.
+if cfg.with_extratags then
+    flex.set_unused_handling{delete_keys = {'tiger:*'}}  -- only configured on this branch
+    flex.add_for_extratags('name')
+    flex.add_for_extratags('address')
+else
+    flex.ignore_keys('name')
+    flex.ignore_keys('address')
+end
diff --git a/lib-lua/themes/nominatim/topics/admin.lua b/lib-lua/themes/nominatim/topics/admin.lua
new file mode 100644
index 00000000..47f4e248
--- /dev/null
+++ b/lib-lua/themes/nominatim/topics/admin.lua
@@ -0,0 +1,20 @@
+local _, flex, cfg = ...  -- chunk arguments; only the 2nd (flex) and 3rd (cfg) are used
+-- Main tags: the 'admin' group only; no modify_main_tags call in this topic.
+flex.set_main_tags('admin')
+-- Name tags: the 'core' group only.
+flex.set_name_tags('core')
+-- Address tags: 'core'; the postcode fallback is switched off explicitly.
+flex.set_address_tags('core')
+flex.set_postcode_fallback(false)
+-- Unconditional part: ignore the 'metatags' keys, pass 'required' to add_for_extratags.
+flex.ignore_keys('metatags')
+flex.add_for_extratags('required')
+-- cfg.with_extratags decides whether the 'name'/'address' key groups go to extratags or are ignored.
+if cfg.with_extratags then
+    flex.set_unused_handling{delete_keys = {'tiger:*'}}  -- only configured on this branch
+    flex.add_for_extratags('name')
+    flex.add_for_extratags('address')
+else
+    flex.ignore_keys('name')
+    flex.ignore_keys('address')
+end
diff --git a/lib-lua/themes/nominatim/topics/full.lua b/lib-lua/themes/nominatim/topics/full.lua
new file mode 100644
index 00000000..a0b61b0f
--- /dev/null
+++ b/lib-lua/themes/nominatim/topics/full.lua
@@ -0,0 +1,32 @@
+local _, flex, cfg = ...  -- chunk arguments; only the 2nd (flex) and 3rd (cfg) are used
+-- Pick the POI preset suffix: 'extra' when cfg.with_extratags is truthy, otherwise 'delete'.
+local group
+if cfg.with_extratags then
+    group = 'extra'
+else
+    group = 'delete'
+end
+-- Main tags: 'all_boundaries', then 'natural', the street theme and 'poi/<group>' in that order.
+flex.set_main_tags('all_boundaries')
+flex.modify_main_tags('natural')
+flex.modify_main_tags('street/' .. (cfg.street_theme or 'default'))  -- 'default' when no theme is set
+flex.modify_main_tags('poi/' .. group)
+-- Name tags: 'core', then 'address' and 'poi'.
+flex.set_name_tags('core')
+flex.modify_name_tags('address')
+flex.modify_name_tags('poi')
+-- Address tags: 'core', then 'houses'.
+flex.set_address_tags('core')
+flex.modify_address_tags('houses')
+-- Unconditional part: ignore the 'metatags' keys, pass 'required' to add_for_extratags.
+flex.ignore_keys('metatags')
+flex.add_for_extratags('required')
+-- cfg.with_extratags decides whether the 'name'/'address' key groups go to extratags or are ignored.
+if cfg.with_extratags then
+    flex.set_unused_handling{delete_keys = {'tiger:*'}}  -- only configured on this branch
+    flex.add_for_extratags('name')
+    flex.add_for_extratags('address')
+else
+    flex.ignore_keys('name')
+    flex.ignore_keys('address')
+end
diff --git a/lib-lua/themes/nominatim/topics/street.lua b/lib-lua/themes/nominatim/topics/street.lua
new file mode 100644
index 00000000..89bed442
--- /dev/null
+++ b/lib-lua/themes/nominatim/topics/street.lua
@@ -0,0 +1,22 @@
+local _, flex, cfg = ...  -- chunk arguments; only the 2nd (flex) and 3rd (cfg) are used
+-- Main tags: 'admin', then the street theme (cfg.street_theme, else 'default') and a postal_code rule.
+flex.set_main_tags('admin')
+flex.modify_main_tags('street/' .. (cfg.street_theme or 'default'))
+flex.modify_main_tags{boundary = {postal_code = 'always'}}
+-- Name tags: the 'core' group only.
+flex.set_name_tags('core')
+-- Address tags: 'core'; the postcode fallback is switched off explicitly.
+flex.set_address_tags('core')
+flex.set_postcode_fallback(false)
+-- Unconditional part: ignore the 'metatags' keys, pass 'required' to add_for_extratags.
+flex.ignore_keys('metatags')
+flex.add_for_extratags('required')
+-- cfg.with_extratags decides whether the 'name'/'address' key groups go to extratags or are ignored.
+if cfg.with_extratags then
+    flex.set_unused_handling{delete_keys = {'tiger:*'}}  -- only configured on this branch
+    flex.add_for_extratags('name')
+    flex.add_for_extratags('address')
+else
+    flex.ignore_keys('name')
+    flex.ignore_keys('address')
+end
diff --git a/lib-sql/functions.sql b/lib-sql/functions.sql
index 158969d9..737a3f21 100644
--- a/lib-sql/functions.sql
+++ b/lib-sql/functions.sql
@@ -8,7 +8,6 @@
 {% include('functions/utils.sql') %}
 {% include('functions/ranking.sql') %}
 {% include('functions/importance.sql') %}
-{% include('functions/address_lookup.sql') %}
 {% include('functions/interpolation.sql') %}
 
 {% if 'place' in db.tables %}
diff --git a/lib-sql/functions/address_lookup.sql b/lib-sql/functions/address_lookup.sql
deleted file mode 100644
index cba11dbf..00000000
--- a/lib-sql/functions/address_lookup.sql
+++ /dev/null
@@ -1,334 +0,0 @@
--- SPDX-License-Identifier: GPL-2.0-only
---
--- This file is part of Nominatim. (https://nominatim.org)
---
--- Copyright (C) 2022 by the Nominatim developer community.
--- For a full list of authors see the git log.
-
--- Functions for returning address information for a place.
-
-DROP TYPE IF EXISTS addressline CASCADE;
-CREATE TYPE addressline as (
-  place_id BIGINT,
-  osm_type CHAR(1),
-  osm_id BIGINT,
-  name HSTORE,
-  class TEXT,
-  type TEXT,
-  place_type TEXT,
-  admin_level INTEGER,
-  fromarea BOOLEAN,
-  isaddress BOOLEAN,
-  rank_address INTEGER,
-  distance FLOAT
-);
-
-
-CREATE OR REPLACE FUNCTION get_name_by_language(name hstore, languagepref TEXT[])
-  RETURNS TEXT
-  AS $$
-DECLARE
-  result TEXT;
-BEGIN
-  IF name is null THEN
-    RETURN null;
-  END IF;
-
-  FOR j IN 1..array_upper(languagepref,1) LOOP
-    IF name ? languagepref[j] THEN
-      result := trim(name->languagepref[j]);
-      IF result != '' THEN
-        return result;
-      END IF;
-    END IF;
-  END LOOP;
-
-  -- as a fallback - take the last element since it is the default name
-  RETURN trim((avals(name))[array_length(avals(name), 1)]);
-END;
-$$
-LANGUAGE plpgsql IMMUTABLE;
-
-
---housenumber only needed for tiger data
-CREATE OR REPLACE FUNCTION get_address_by_language(for_place_id BIGINT,
-                                                   housenumber INTEGER,
-                                                   languagepref TEXT[])
-  RETURNS TEXT
-  AS $$
-DECLARE
-  result TEXT[];
-  currresult TEXT;
-  prevresult TEXT;
-  location RECORD;
-BEGIN
-
-  result := '{}';
-  prevresult := '';
-
-  FOR location IN
-    SELECT name,
-       CASE WHEN place_id = for_place_id THEN 99 ELSE rank_address END as rank_address
-    FROM get_addressdata(for_place_id, housenumber)
-    WHERE isaddress order by rank_address desc
-  LOOP
-    currresult := trim(get_name_by_language(location.name, languagepref));
-    IF currresult != prevresult AND currresult IS NOT NULL
-       AND result[(100 - location.rank_address)] IS NULL
-    THEN
-      result[(100 - location.rank_address)] := currresult;
-      prevresult := currresult;
-    END IF;
-  END LOOP;
-
-  RETURN array_to_string(result,', ');
-END;
-$$
-LANGUAGE plpgsql STABLE;
-
-DROP TYPE IF EXISTS addressdata_place;
-CREATE TYPE addressdata_place AS (
-  place_id BIGINT,
-  country_code VARCHAR(2),
-  housenumber TEXT,
-  postcode TEXT,
-  class TEXT,
-  type TEXT,
-  name HSTORE,
-  address HSTORE,
-  centroid GEOMETRY
-);
-
--- Compute the list of address parts for the given place.
---
--- If in_housenumber is greator or equal 0, look for an interpolation.
-CREATE OR REPLACE FUNCTION get_addressdata(in_place_id BIGINT, in_housenumber INTEGER)
-  RETURNS setof addressline
-  AS $$
-DECLARE
-  place addressdata_place;
-  location RECORD;
-  country RECORD;
-  current_rank_address INTEGER;
-  location_isaddress BOOLEAN;
-BEGIN
-  -- The place in question might not have a direct entry in place_addressline.
-  -- Look for the parent of such places then and save it in place.
-
-  -- first query osmline (interpolation lines)
-  IF in_housenumber >= 0 THEN
-    SELECT parent_place_id as place_id, country_code,
-           in_housenumber as housenumber, postcode,
-           'place' as class, 'house' as type,
-           null as name, null as address,
-           ST_Centroid(linegeo) as centroid
-      INTO place
-      FROM location_property_osmline
-      WHERE place_id = in_place_id
-            AND in_housenumber between startnumber and endnumber;
-  END IF;
-
-  --then query tiger data
-  {% if config.get_bool('USE_US_TIGER_DATA') %}
-  IF place IS NULL AND in_housenumber >= 0 THEN
-    SELECT parent_place_id as place_id, 'us' as country_code,
-           in_housenumber as housenumber, postcode,
-           'place' as class, 'house' as type,
-           null as name, null as address,
-           ST_Centroid(linegeo) as centroid
-      INTO place
-      FROM location_property_tiger
-      WHERE place_id = in_place_id
-            AND in_housenumber between startnumber and endnumber;
-  END IF;
-  {% endif %}
-
-  -- postcode table
-  IF place IS NULL THEN
-    SELECT parent_place_id as place_id, country_code,
-           null::text as housenumber, postcode,
-           'place' as class, 'postcode' as type,
-           null as name, null as address,
-           null as centroid
-      INTO place
-      FROM location_postcode
-      WHERE place_id = in_place_id;
-  END IF;
-
-  -- POI objects in the placex table
-  IF place IS NULL THEN
-    SELECT parent_place_id as place_id, country_code,
-           coalesce(address->'housenumber',
-                    address->'streetnumber',
-                    address->'conscriptionnumber')::text as housenumber,
-           postcode,
-           class, type,
-           name, address,
-           centroid
-      INTO place
-      FROM placex
-      WHERE place_id = in_place_id and rank_search > 27;
-  END IF;
-
-  -- If place is still NULL at this point then the object has its own
-  -- entry in place_address line. However, still check if there is not linked
-  -- place we should be using instead.
-  IF place IS NULL THEN
-    select coalesce(linked_place_id, place_id) as place_id,  country_code,
-           null::text as housenumber, postcode,
-           class, type,
-           null as name, address,
-           null as centroid
-      INTO place
-      FROM placex where place_id = in_place_id;
-  END IF;
-
---RAISE WARNING '% % % %',searchcountrycode, searchhousenumber, searchpostcode;
-
-  -- --- Return the record for the base entry.
-
-  current_rank_address := 1000;
-  FOR location IN
-    SELECT placex.place_id, osm_type, osm_id, name,
-           coalesce(extratags->'linked_place', extratags->'place') as place_type,
-           class, type, admin_level,
-           CASE WHEN rank_address = 0 THEN 100
-                WHEN rank_address = 11 THEN 5
-                ELSE rank_address END as rank_address,
-           country_code
-      FROM placex
-      WHERE place_id = place.place_id
-  LOOP
---RAISE WARNING '%',location;
-    -- mix in default names for countries
-    IF location.rank_address = 4 and place.country_code is not NULL THEN
-      FOR country IN
-        SELECT coalesce(name, ''::hstore) as name FROM country_name
-          WHERE country_code = place.country_code LIMIT 1
-      LOOP
-        place.name := country.name || place.name;
-      END LOOP;
-    END IF;
-
-    IF location.rank_address < 4 THEN
-      -- no country locations for ranks higher than country
-      place.country_code := NULL::varchar(2);
-    ELSEIF place.country_code IS NULL AND location.country_code IS NOT NULL THEN
-      place.country_code := location.country_code;
-    END IF;
-
-    RETURN NEXT ROW(location.place_id, location.osm_type, location.osm_id,
-                    location.name, location.class, location.type,
-                    location.place_type,
-                    location.admin_level, true,
-                    location.type not in ('postcode', 'postal_code'),
-                    location.rank_address, 0)::addressline;
-
-    current_rank_address := location.rank_address;
-  END LOOP;
-
-  -- --- Return records for address parts.
-
-  FOR location IN
-    SELECT placex.place_id, osm_type, osm_id, name, class, type,
-           coalesce(extratags->'linked_place', extratags->'place') as place_type,
-           admin_level, fromarea, isaddress and linked_place_id is NULL as isaddress,
-           CASE WHEN rank_address = 11 THEN 5 ELSE rank_address END as rank_address,
-           distance, country_code, postcode
-      FROM place_addressline join placex on (address_place_id = placex.place_id)
-      WHERE place_addressline.place_id IN (place.place_id, in_place_id)
-            AND linked_place_id is null
-            AND (placex.country_code IS NULL OR place.country_code IS NULL
-                 OR placex.country_code = place.country_code)
-      ORDER BY rank_address desc,
-               (place_addressline.place_id = in_place_id) desc,
-               (CASE WHEN coalesce((avals(name) && avals(place.address)), False) THEN 2
-                     WHEN isaddress THEN 0
-                     WHEN fromarea
-                          and place.centroid is not null
-                          and ST_Contains(geometry, place.centroid) THEN 1
-                     ELSE -1 END) desc,
-               fromarea desc, distance asc, rank_search desc
-  LOOP
-    -- RAISE WARNING '%',location;
-    location_isaddress := location.rank_address != current_rank_address;
-
-    IF place.country_code IS NULL AND location.country_code IS NOT NULL THEN
-      place.country_code := location.country_code;
-    END IF;
-    IF location.type in ('postcode', 'postal_code')
-       AND place.postcode is not null
-    THEN
-      -- If the place had a postcode assigned, take this one only
-      -- into consideration when it is an area and the place does not have
-      -- a postcode itself.
-      IF location.fromarea AND location_isaddress
-         AND (place.address is null or not place.address ? 'postcode')
-      THEN
-        place.postcode := null; -- remove the less exact postcode
-      ELSE
-        location_isaddress := false;
-      END IF;
-    END IF;
-    RETURN NEXT ROW(location.place_id, location.osm_type, location.osm_id,
-                    location.name, location.class, location.type,
-                    location.place_type,
-                    location.admin_level, location.fromarea,
-                    location_isaddress,
-                    location.rank_address,
-                    location.distance)::addressline;
-
-    current_rank_address := location.rank_address;
-  END LOOP;
-
-  -- If no country was included yet, add the name information from country_name.
-  IF current_rank_address > 4 THEN
-    FOR location IN
-      SELECT name || coalesce(derived_name, ''::hstore) as name FROM country_name
-        WHERE country_code = place.country_code LIMIT 1
-    LOOP
---RAISE WARNING '% % %',current_rank_address,searchcountrycode,countryname;
-      RETURN NEXT ROW(null, null, null, location.name, 'place', 'country', NULL,
-                      null, true, true, 4, 0)::addressline;
-    END LOOP;
-  END IF;
-
-  -- Finally add some artificial rows.
-  IF place.country_code IS NOT NULL THEN
-    location := ROW(null, null, null, hstore('ref', place.country_code),
-                    'place', 'country_code', null, null, true, false, 4, 0)::addressline;
-    RETURN NEXT location;
-  END IF;
-
-  IF place.name IS NOT NULL THEN
-    location := ROW(in_place_id, null, null, place.name, place.class,
-                    place.type, null, null, true, true, 29, 0)::addressline;
-    RETURN NEXT location;
-  END IF;
-
-  IF place.housenumber IS NOT NULL THEN
-    location := ROW(null, null, null, hstore('ref', place.housenumber),
-                    'place', 'house_number', null, null, true, true, 28, 0)::addressline;
-    RETURN NEXT location;
-  END IF;
-
-  IF place.address is not null and place.address ? '_unlisted_place' THEN
-    RETURN NEXT ROW(null, null, null, hstore('name', place.address->'_unlisted_place'),
-                    'place', 'locality', null, null, true, true, 25, 0)::addressline;
-  END IF;
-
-  IF place.postcode is not null THEN
-    location := ROW(null, null, null, hstore('ref', place.postcode), 'place',
-                    'postcode', null, null, false, true, 5, 0)::addressline;
-    RETURN NEXT location;
-  ELSEIF place.address is not null and place.address ? 'postcode'
-         and not place.address->'postcode' SIMILAR TO '%(,|;)%' THEN
-    location := ROW(null, null, null, hstore('ref', place.address->'postcode'), 'place',
-                    'postcode', null, null, false, true, 5, 0)::addressline;
-    RETURN NEXT location;
-  END IF;
-
-  RETURN;
-END;
-$$
-LANGUAGE plpgsql STABLE;
diff --git a/lib-sql/functions/importance.sql b/lib-sql/functions/importance.sql
index 1de5899c..4993d70b 100644
--- a/lib-sql/functions/importance.sql
+++ b/lib-sql/functions/importance.sql
@@ -65,7 +65,7 @@ BEGIN
   RETURN NULL;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 {% else %}
 
@@ -78,7 +78,7 @@ SELECT convert_from(CAST(E'\\x' || array_to_string(ARRAY(
     FROM regexp_matches($1, '%[0-9a-f][0-9a-f]|.', 'gi') AS r(m)
 ), '') AS bytea), 'UTF8');
 $$ 
-LANGUAGE SQL IMMUTABLE STRICT;
+LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION catch_decode_url_part(p varchar)
@@ -91,7 +91,7 @@ EXCEPTION
   WHEN others THEN return null;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE STRICT;
+LANGUAGE plpgsql IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_wikipedia_match(extratags HSTORE, country_code varchar(2))
@@ -139,7 +139,7 @@ BEGIN
   RETURN NULL;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 {% endif %}
 
@@ -203,5 +203,5 @@ BEGIN
   RETURN result;
 END;
 $$
-LANGUAGE plpgsql;
+LANGUAGE plpgsql PARALLEL SAFE;
 
diff --git a/lib-sql/functions/interpolation.sql b/lib-sql/functions/interpolation.sql
index 2fd21e8a..452ef7c3 100644
--- a/lib-sql/functions/interpolation.sql
+++ b/lib-sql/functions/interpolation.sql
@@ -34,7 +34,7 @@ BEGIN
   RETURN in_address;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 
@@ -70,7 +70,7 @@ BEGIN
   RETURN parent_place_id;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION reinsert_interpolation(way_id BIGINT, addr HSTORE,
diff --git a/lib-sql/functions/partition-functions.sql b/lib-sql/functions/partition-functions.sql
index 20ec3da6..d3c83615 100644
--- a/lib-sql/functions/partition-functions.sql
+++ b/lib-sql/functions/partition-functions.sql
@@ -17,28 +17,6 @@ CREATE TYPE nearfeaturecentr AS (
   centroid GEOMETRY
 );
 
--- feature intersects geometry
--- for areas and linestrings they must touch at least along a line
-CREATE OR REPLACE FUNCTION is_relevant_geometry(de9im TEXT, geom_type TEXT)
-RETURNS BOOLEAN
-AS $$
-BEGIN
-  IF substring(de9im from 1 for 2) != 'FF' THEN
-    RETURN TRUE;
-  END IF;
-
-  IF geom_type = 'ST_Point' THEN
-    RETURN substring(de9im from 4 for 1) = '0';
-  END IF;
-
-  IF geom_type in ('ST_LineString', 'ST_MultiLineString') THEN
-    RETURN substring(de9im from 4 for 1) = '1';
-  END IF;
-
-  RETURN substring(de9im from 4 for 1) = '2';
-END
-$$ LANGUAGE plpgsql IMMUTABLE;
-
 CREATE OR REPLACE function getNearFeatures(in_partition INTEGER, feature GEOMETRY,
                                            feature_centroid GEOMETRY,
                                            maxrank INTEGER)
@@ -59,7 +37,12 @@ BEGIN
              isguess, postcode, centroid
       FROM location_area_large_{{ partition }}
       WHERE geometry && feature
-        AND is_relevant_geometry(ST_Relate(geometry, feature), ST_GeometryType(feature))
+        AND CASE WHEN ST_Dimension(feature) = 0
+                     THEN _ST_Covers(geometry, feature)
+                 WHEN ST_Dimension(feature) = 2
+                     THEN ST_Relate(geometry, feature, 'T********')
+                 ELSE ST_NPoints(ST_Intersection(geometry, feature)) > 1
+            END
         AND rank_address < maxrank
             -- Postcodes currently still use rank_search to define for which
             -- features they are relevant.
@@ -75,7 +58,7 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_address_place(in_partition SMALLINT, feature GEOMETRY,
@@ -104,7 +87,7 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 create or replace function deleteLocationArea(in_partition INTEGER, in_place_id BIGINT, in_rank_search INTEGER) RETURNS BOOLEAN AS $$
@@ -142,14 +125,16 @@ BEGIN
 
   IF in_rank_search <= 4 and not in_estimate THEN
     INSERT INTO location_area_country (place_id, country_code, geometry)
-      values (in_place_id, in_country_code, in_geometry);
+      (SELECT in_place_id, in_country_code, geom
+       FROM split_geometry(in_geometry) as geom);
     RETURN TRUE;
   END IF;
 
 {% for partition in db.partitions %}
   IF in_partition = {{ partition }} THEN
     INSERT INTO location_area_large_{{ partition }} (partition, place_id, country_code, keywords, rank_search, rank_address, isguess, postcode, centroid, geometry)
-      values (in_partition, in_place_id, in_country_code, in_keywords, in_rank_search, in_rank_address, in_estimate, postcode, in_centroid, in_geometry);
+      (SELECT in_partition, in_place_id, in_country_code, in_keywords, in_rank_search, in_rank_address, in_estimate, postcode, in_centroid, geom
+       FROM split_geometry(in_geometry) as geom);
     RETURN TRUE;
   END IF;
 {% endfor %}
@@ -187,7 +172,7 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 CREATE OR REPLACE FUNCTION getNearestNamedPlacePlaceId(in_partition INTEGER,
                                                        point GEOMETRY,
@@ -217,7 +202,7 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 create or replace function insertSearchName(
   in_partition INTEGER, in_place_id BIGINT, in_name_vector INTEGER[],
@@ -325,7 +310,7 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 CREATE OR REPLACE FUNCTION getNearestParallelRoadFeature(in_partition INTEGER,
                                                          line GEOMETRY)
@@ -369,4 +354,4 @@ BEGIN
   RAISE EXCEPTION 'Unknown partition %', in_partition;
 END
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
diff --git a/lib-sql/functions/placex_triggers.sql b/lib-sql/functions/placex_triggers.sql
index 9d0d73b5..8524ffc3 100644
--- a/lib-sql/functions/placex_triggers.sql
+++ b/lib-sql/functions/placex_triggers.sql
@@ -109,7 +109,7 @@ BEGIN
   RETURN result;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION find_associated_street(poi_osm_type CHAR(1),
@@ -200,7 +200,7 @@ BEGIN
   RETURN result;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 -- Find the parent road of a POI.
@@ -286,7 +286,7 @@ BEGIN
   RETURN parent_place_id;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 -- Try to find a linked place for the given object.
 CREATE OR REPLACE FUNCTION find_linked_place(bnd placex)
@@ -404,7 +404,7 @@ BEGIN
   RETURN NULL;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION create_poi_search_terms(obj_place_id BIGINT,
diff --git a/lib-sql/functions/ranking.sql b/lib-sql/functions/ranking.sql
index 97a0cde3..c16ad1db 100644
--- a/lib-sql/functions/ranking.sql
+++ b/lib-sql/functions/ranking.sql
@@ -29,7 +29,7 @@ BEGIN
   RETURN 0.02;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 -- Return an approximate update radius according to the search rank.
@@ -60,7 +60,7 @@ BEGIN
   RETURN 0;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 -- Compute a base address rank from the extent of the given geometry.
 --
@@ -107,7 +107,7 @@ BEGIN
    RETURN 23;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 -- Guess a ranking for postcodes from country and postcode format.
@@ -167,7 +167,7 @@ BEGIN
 
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 -- Get standard search and address rank for an object.
@@ -236,7 +236,7 @@ BEGIN
   END IF;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 CREATE OR REPLACE FUNCTION get_addr_tag_rank(key TEXT, country TEXT,
                                              OUT from_rank SMALLINT,
@@ -283,7 +283,7 @@ BEGIN
   END LOOP;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION weigh_search(search_vector INT[],
@@ -304,4 +304,4 @@ BEGIN
   RETURN def_weight;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
diff --git a/lib-sql/functions/utils.sql b/lib-sql/functions/utils.sql
index df00f916..30f94080 100644
--- a/lib-sql/functions/utils.sql
+++ b/lib-sql/functions/utils.sql
@@ -24,7 +24,7 @@ BEGIN
   RETURN ST_PointOnSurface(place);
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION geometry_sector(partition INTEGER, place GEOMETRY)
@@ -34,7 +34,7 @@ BEGIN
   RETURN (partition*1000000) + (500-ST_X(place)::INTEGER)*1000 + (500-ST_Y(place)::INTEGER);
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 
@@ -60,7 +60,7 @@ BEGIN
   RETURN r;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 -- Return the node members with a given label from a relation member list
 -- as a set.
@@ -88,7 +88,7 @@ BEGIN
   RETURN;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_rel_node_members(members JSONB, memberLabels TEXT[])
@@ -107,7 +107,7 @@ BEGIN
   RETURN;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 -- Copy 'name' to or from the default language.
@@ -136,7 +136,7 @@ BEGIN
   END IF;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 -- Find the nearest artificial postcode for the given geometry.
@@ -172,7 +172,7 @@ BEGIN
     RETURN outcode;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_country_code(place geometry)
@@ -233,7 +233,7 @@ BEGIN
   RETURN NULL;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_country_language_code(search_country_code VARCHAR(2))
@@ -251,7 +251,7 @@ BEGIN
   RETURN NULL;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION get_partition(in_country_code VARCHAR(10))
@@ -268,7 +268,7 @@ BEGIN
   RETURN 0;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 -- Find the parent of an address with addr:street/addr:place tag.
@@ -299,7 +299,7 @@ BEGIN
   RETURN parent_place_id;
 END;
 $$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql STABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION delete_location(OLD_place_id BIGINT)
@@ -337,7 +337,7 @@ BEGIN
                      ST_Project(geom::geography, radius, 3.9269908)::geometry));
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION add_location(place_id BIGINT, country_code varchar(2),
@@ -348,8 +348,6 @@ CREATE OR REPLACE FUNCTION add_location(place_id BIGINT, country_code varchar(2)
   RETURNS BOOLEAN
   AS $$
 DECLARE
-  locationid INTEGER;
-  secgeo GEOMETRY;
   postcode TEXT;
 BEGIN
   PERFORM deleteLocationArea(partition, place_id, rank_search);
@@ -360,18 +358,19 @@ BEGIN
       postcode := upper(trim (in_postcode));
   END IF;
 
-  IF ST_GeometryType(geometry) in ('ST_Polygon','ST_MultiPolygon') THEN
-    FOR secgeo IN select split_geometry(geometry) AS geom LOOP
-      PERFORM insertLocationAreaLarge(partition, place_id, country_code, keywords, rank_search, rank_address, false, postcode, centroid, secgeo);
-    END LOOP;
-
-  ELSEIF ST_GeometryType(geometry) = 'ST_Point' THEN
-    secgeo := place_node_fuzzy_area(geometry, rank_search);
-    PERFORM insertLocationAreaLarge(partition, place_id, country_code, keywords, rank_search, rank_address, true, postcode, centroid, secgeo);
+  IF ST_Dimension(geometry) = 2 THEN
+    RETURN insertLocationAreaLarge(partition, place_id, country_code, keywords,
+                                   rank_search, rank_address, false, postcode,
+                                   centroid, geometry);
+  END IF;
 
+  IF ST_Dimension(geometry) = 0 THEN
+    RETURN insertLocationAreaLarge(partition, place_id, country_code, keywords,
+                                   rank_search, rank_address, true, postcode,
+                                   centroid, place_node_fuzzy_area(geometry, rank_search));
   END IF;
 
-  RETURN true;
+  RETURN false;
 END;
 $$
 LANGUAGE plpgsql;
@@ -394,19 +393,21 @@ DECLARE
   geo RECORD;
   area FLOAT;
   remainingdepth INTEGER;
-  added INTEGER;
 BEGIN
-
 --  RAISE WARNING 'quad_split_geometry: maxarea=%, depth=%',maxarea,maxdepth;
 
-  IF (ST_GeometryType(geometry) not in ('ST_Polygon','ST_MultiPolygon') OR NOT ST_IsValid(geometry)) THEN
+  IF not ST_IsValid(geometry) THEN
+    RETURN;
+  END IF;
+
+  IF ST_Dimension(geometry) != 2 OR maxdepth <= 1 THEN
     RETURN NEXT geometry;
     RETURN;
   END IF;
 
   remainingdepth := maxdepth - 1;
   area := ST_AREA(geometry);
-  IF remainingdepth < 1 OR area < maxarea THEN
+  IF area < maxarea THEN
     RETURN NEXT geometry;
     RETURN;
   END IF;
@@ -426,7 +427,6 @@ BEGIN
   xmid := (xmin+xmax)/2;
   ymid := (ymin+ymax)/2;
 
-  added := 0;
   FOR seg IN 1..4 LOOP
 
     IF seg = 1 THEN
@@ -442,23 +442,20 @@ BEGIN
       secbox := ST_SetSRID(ST_MakeBox2D(ST_Point(xmid,ymid),ST_Point(xmax,ymax)),4326);
     END IF;
 
-    IF st_intersects(geometry, secbox) THEN
-      secgeo := st_intersection(geometry, secbox);
-      IF NOT ST_IsEmpty(secgeo) AND ST_GeometryType(secgeo) in ('ST_Polygon','ST_MultiPolygon') THEN
-        FOR geo IN select quad_split_geometry(secgeo, maxarea, remainingdepth) as geom LOOP
-          IF NOT ST_IsEmpty(geo.geom) AND ST_GeometryType(geo.geom) in ('ST_Polygon','ST_MultiPolygon') THEN
-            added := added + 1;
-            RETURN NEXT geo.geom;
-          END IF;
-        END LOOP;
-      END IF;
+    secgeo := st_intersection(geometry, secbox);
+    IF NOT ST_IsEmpty(secgeo) AND ST_Dimension(secgeo) = 2 THEN
+      FOR geo IN SELECT quad_split_geometry(secgeo, maxarea, remainingdepth) as geom LOOP
+        IF NOT ST_IsEmpty(geo.geom) AND ST_Dimension(geo.geom) = 2 THEN
+          RETURN NEXT geo.geom;
+        END IF;
+      END LOOP;
     END IF;
   END LOOP;
 
   RETURN;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION split_geometry(geometry GEOMETRY)
@@ -467,14 +464,26 @@ CREATE OR REPLACE FUNCTION split_geometry(geometry GEOMETRY)
 DECLARE
   geo RECORD;
 BEGIN
-  -- 10000000000 is ~~ 1x1 degree
-  FOR geo IN select quad_split_geometry(geometry, 0.25, 20) as geom LOOP
-    RETURN NEXT geo.geom;
-  END LOOP;
+  IF ST_GeometryType(geometry) = 'ST_MultiPolygon'
+     and ST_Area(geometry) * 10 > ST_Area(Box2D(geometry))
+  THEN
+    FOR geo IN
+        SELECT quad_split_geometry(g, 0.25, 20) as geom
+        FROM (SELECT (ST_Dump(geometry)).geom::geometry(Polygon, 4326) AS g) xx
+    LOOP
+      RETURN NEXT geo.geom;
+    END LOOP;
+  ELSE
+    FOR geo IN
+        SELECT quad_split_geometry(geometry, 0.25, 20) as geom
+    LOOP
+      RETURN NEXT geo.geom;
+    END LOOP;
+  END IF;
   RETURN;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 CREATE OR REPLACE FUNCTION simplify_large_polygons(geometry GEOMETRY)
   RETURNS GEOMETRY
@@ -488,7 +497,7 @@ BEGIN
   RETURN geometry;
 END;
 $$
-LANGUAGE plpgsql IMMUTABLE;
+LANGUAGE plpgsql IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION place_force_delete(placeid BIGINT)
diff --git a/lib-sql/tokenizer/icu_tokenizer.sql b/lib-sql/tokenizer/icu_tokenizer.sql
index 04fcedcb..8cf13120 100644
--- a/lib-sql/tokenizer/icu_tokenizer.sql
+++ b/lib-sql/tokenizer/icu_tokenizer.sql
@@ -12,7 +12,7 @@ CREATE OR REPLACE FUNCTION token_get_name_search_tokens(info JSONB)
   RETURNS INTEGER[]
 AS $$
   SELECT (info->>'names')::INTEGER[]
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 -- Get tokens for matching the place name against others.
@@ -22,7 +22,7 @@ CREATE OR REPLACE FUNCTION token_get_name_match_tokens(info JSONB)
   RETURNS INTEGER[]
 AS $$
   SELECT (info->>'names')::INTEGER[]
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 -- Return the housenumber tokens applicable for the place.
@@ -30,7 +30,7 @@ CREATE OR REPLACE FUNCTION token_get_housenumber_search_tokens(info JSONB)
   RETURNS INTEGER[]
 AS $$
   SELECT (info->>'hnr_tokens')::INTEGER[]
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 -- Return the housenumber in the form that it can be matched during search.
@@ -38,77 +38,77 @@ CREATE OR REPLACE FUNCTION token_normalized_housenumber(info JSONB)
   RETURNS TEXT
 AS $$
   SELECT info->>'hnr';
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_is_street_address(info JSONB)
   RETURNS BOOLEAN
 AS $$
   SELECT info->>'street' is not null or info->>'place' is null;
-$$ LANGUAGE SQL IMMUTABLE;
+$$ LANGUAGE SQL IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_has_addr_street(info JSONB)
   RETURNS BOOLEAN
 AS $$
   SELECT info->>'street' is not null and info->>'street' != '{}';
-$$ LANGUAGE SQL IMMUTABLE;
+$$ LANGUAGE SQL IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_has_addr_place(info JSONB)
   RETURNS BOOLEAN
 AS $$
   SELECT info->>'place' is not null;
-$$ LANGUAGE SQL IMMUTABLE;
+$$ LANGUAGE SQL IMMUTABLE PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_matches_street(info JSONB, street_tokens INTEGER[])
   RETURNS BOOLEAN
 AS $$
   SELECT (info->>'street')::INTEGER[] && street_tokens
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_matches_place(info JSONB, place_tokens INTEGER[])
   RETURNS BOOLEAN
 AS $$
   SELECT (info->>'place')::INTEGER[] <@ place_tokens
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_addr_place_search_tokens(info JSONB)
   RETURNS INTEGER[]
 AS $$
   SELECT (info->>'place')::INTEGER[]
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_get_address_keys(info JSONB)
   RETURNS SETOF TEXT
 AS $$
   SELECT * FROM jsonb_object_keys(info->'addr');
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_get_address_search_tokens(info JSONB, key TEXT)
   RETURNS INTEGER[]
 AS $$
   SELECT (info->'addr'->>key)::INTEGER[];
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_matches_address(info JSONB, key TEXT, tokens INTEGER[])
   RETURNS BOOLEAN
 AS $$
   SELECT (info->'addr'->>key)::INTEGER[] <@ tokens;
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 CREATE OR REPLACE FUNCTION token_get_postcode(info JSONB)
   RETURNS TEXT
 AS $$
   SELECT info->>'postcode';
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 
 -- Return token info that should be saved permanently in the database.
@@ -116,7 +116,7 @@ CREATE OR REPLACE FUNCTION token_strip_info(info JSONB)
   RETURNS JSONB
 AS $$
   SELECT NULL::JSONB;
-$$ LANGUAGE SQL IMMUTABLE STRICT;
+$$ LANGUAGE SQL IMMUTABLE STRICT PARALLEL SAFE;
 
 --------------- private functions ----------------------------------------------
 
@@ -128,16 +128,14 @@ DECLARE
   partial_terms TEXT[] = '{}'::TEXT[];
   term TEXT;
   term_id INTEGER;
-  term_count INTEGER;
 BEGIN
   SELECT min(word_id) INTO full_token
     FROM word WHERE word = norm_term and type = 'W';
 
   IF full_token IS NULL THEN
     full_token := nextval('seq_word');
-    INSERT INTO word (word_id, word_token, type, word, info)
-      SELECT full_token, lookup_term, 'W', norm_term,
-             json_build_object('count', 0)
+    INSERT INTO word (word_id, word_token, type, word)
+      SELECT full_token, lookup_term, 'W', norm_term
         FROM unnest(lookup_terms) as lookup_term;
   END IF;
 
@@ -150,14 +148,67 @@ BEGIN
 
   partial_tokens := '{}'::INT[];
   FOR term IN SELECT unnest(partial_terms) LOOP
-    SELECT min(word_id), max(info->>'count') INTO term_id, term_count
+    SELECT min(word_id) INTO term_id
+      FROM word WHERE word_token = term and type = 'w';
+
+    IF term_id IS NULL THEN
+      term_id := nextval('seq_word');
+      INSERT INTO word (word_id, word_token, type)
+        VALUES (term_id, term, 'w');
+    END IF;
+
+    partial_tokens := array_merge(partial_tokens, ARRAY[term_id]);
+  END LOOP;
+END;
+$$
+LANGUAGE plpgsql;
+
+
+CREATE OR REPLACE FUNCTION getorcreate_full_word(norm_term TEXT,
+                                                 lookup_terms TEXT[],
+                                                 lookup_norm_terms TEXT[],
+                                                 OUT full_token INT,
+                                                 OUT partial_tokens INT[])
+  AS $$
+DECLARE
+  partial_terms TEXT[] = '{}'::TEXT[];
+  term TEXT;
+  term_id INTEGER;
+BEGIN
+  SELECT min(word_id) INTO full_token
+    FROM word WHERE word = norm_term and type = 'W';
+
+  IF full_token IS NULL THEN
+    full_token := nextval('seq_word');
+    IF lookup_norm_terms IS NULL THEN
+      INSERT INTO word (word_id, word_token, type, word)
+        SELECT full_token, lookup_term, 'W', norm_term
+          FROM unnest(lookup_terms) as lookup_term;
+    ELSE
+      INSERT INTO word (word_id, word_token, type, word, info)
+        SELECT full_token, t.lookup, 'W', norm_term,
+               CASE WHEN norm_term = t.norm THEN null
+               ELSE json_build_object('lookup', t.norm) END
+          FROM unnest(lookup_terms, lookup_norm_terms) as t(lookup, norm);
+    END IF;
+  END IF;
+
+  FOR term IN SELECT unnest(string_to_array(unnest(lookup_terms), ' ')) LOOP
+    term := trim(term);
+    IF NOT (ARRAY[term] <@ partial_terms) THEN
+      partial_terms := partial_terms || term;
+    END IF;
+  END LOOP;
+
+  partial_tokens := '{}'::INT[];
+  FOR term IN SELECT unnest(partial_terms) LOOP
+    SELECT min(word_id) INTO term_id
       FROM word WHERE word_token = term and type = 'w';
 
     IF term_id IS NULL THEN
       term_id := nextval('seq_word');
-      term_count := 0;
-      INSERT INTO word (word_id, word_token, type, info)
-        VALUES (term_id, term, 'w', json_build_object('count', term_count));
+      INSERT INTO word (word_id, word_token, type)
+        VALUES (term_id, term, 'w');
     END IF;
 
     partial_tokens := array_merge(partial_tokens, ARRAY[term_id]);
diff --git a/nominatim-cli.py b/nominatim-cli.py
index 1f3c1210..7a1aadb8 100755
--- a/nominatim-cli.py
+++ b/nominatim-cli.py
@@ -3,7 +3,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Helper script for development to run nominatim from the source directory.
@@ -15,4 +15,4 @@ sys.path.insert(1, str((Path(__file__) / '..' / 'src').resolve()))
 
 from nominatim_db import cli
 
-exit(cli.nominatim(module_dir=None, osm2pgsql_path=None))
+exit(cli.nominatim())
diff --git a/packaging/nominatim-api/extra_src/paths.py b/packaging/nominatim-api/extra_src/paths.py
index 797acbb5..7d186da1 100644
--- a/packaging/nominatim-api/extra_src/paths.py
+++ b/packaging/nominatim-api/extra_src/paths.py
@@ -11,4 +11,5 @@ from pathlib import Path
 
 DATA_DIR = None
 SQLLIB_DIR = None
+LUALIB_DIR = None
 CONFIG_DIR = (Path(__file__) / '..' / 'resources' / 'settings').resolve()
diff --git a/packaging/nominatim-api/pyproject.toml b/packaging/nominatim-api/pyproject.toml
index d4ea8d8c..e467e8ac 100644
--- a/packaging/nominatim-api/pyproject.toml
+++ b/packaging/nominatim-api/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "nominatim-api"
-version = "4.5.0.post6"
+version = "5.1.0.post7"
 description = "A tool for building a database of OpenStreetMap for geocoding and for searching the database. Search library."
 readme = "README.md"
 requires-python = ">=3.7"
@@ -16,13 +16,9 @@ classifiers = [
     "Operating System :: OS Independent",
 ]
 dependencies = [
-    "python-dotenv==1.0.1",
-    "pyYAML==6.0.2",
-    "SQLAlchemy==2.0.36",
-    "psycopg[binary]==3.2.3",
-    "PyICU==2.14",
+    "SQLAlchemy==2.0.41",
     "falcon==4.0.2",
-    "uvicorn==0.32.0",
+    "uvicorn==0.34.2",
     "gunicorn==23.0.0"
 ]
 
diff --git a/packaging/nominatim-db/extra_src/nominatim_db/paths.py b/packaging/nominatim-db/extra_src/nominatim_db/paths.py
index 796ff08b..02df5047 100644
--- a/packaging/nominatim-db/extra_src/nominatim_db/paths.py
+++ b/packaging/nominatim-db/extra_src/nominatim_db/paths.py
@@ -11,4 +11,5 @@ from pathlib import Path
 
 DATA_DIR = (Path(__file__) / '..' / 'resources').resolve()
 SQLLIB_DIR = (DATA_DIR / 'lib-sql')
+LUALIB_DIR = (DATA_DIR / 'lib-lua')
 CONFIG_DIR = (DATA_DIR / 'settings')
diff --git a/packaging/nominatim-db/lib-lua b/packaging/nominatim-db/lib-lua
new file mode 120000
index 00000000..e4e1bd04
--- /dev/null
+++ b/packaging/nominatim-db/lib-lua
@@ -0,0 +1 @@
+../../lib-lua
\ No newline at end of file
diff --git a/packaging/nominatim-db/pyproject.toml b/packaging/nominatim-db/pyproject.toml
index 17065eb6..a695f28d 100644
--- a/packaging/nominatim-db/pyproject.toml
+++ b/packaging/nominatim-db/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "nominatim-db"
-version = "4.5.0.post6"
+version = "5.1.0.post7"
 description = "A tool for building a database of OpenStreetMap for geocoding and for searching the database. Database backend."
 readme = "README.md"
 requires-python = ">=3.7"
@@ -16,13 +16,12 @@ classifiers = [
     "Operating System :: OS Independent",
 ]
 dependencies = [
-    "psycopg[binary]==3.2.3",
-    "python-dotenv==1.0.1",
-    "jinja2==3.1.4",
+    "psycopg[binary]==3.2.9",
+    "python-dotenv==1.1.0",
+    "jinja2==3.1.6",
     "pyYAML==6.0.2",
-    "datrie==0.8.2",
-    "psutil==6.1.0",
-    "PyICU==2.14",
+    "psutil==7.0.0",
+    "PyICU==2.15.2",
     "osmium==4.0.2",
 ]
 
@@ -45,6 +44,7 @@ include = [
     "src/nominatim_db",
     "scripts",
     "lib-sql/**/*.sql",
+    "lib-lua/**/*.lua",
     "settings",
     "data/words.sql",
     "extra_src/nominatim_db/paths.py"
@@ -66,6 +66,7 @@ packages = ["src/nominatim_db"]
 
 [tool.hatch.build.targets.wheel.force-include]
 "lib-sql" = "nominatim_db/resources/lib-sql"
+"lib-lua" = "nominatim_db/resources/lib-lua"
 "settings" = "nominatim_db/resources/settings"
 "data/country_osm_grid.sql.gz" = "nominatim_db/resources/country_osm_grid.sql.gz"
 "data/words.sql" = "nominatim_db/resources/words.sql"
diff --git a/packaging/nominatim-db/scripts/nominatim b/packaging/nominatim-db/scripts/nominatim
index 184ab4c6..bc384b02 100755
--- a/packaging/nominatim-db/scripts/nominatim
+++ b/packaging/nominatim-db/scripts/nominatim
@@ -2,4 +2,4 @@
 
 from nominatim_db import cli
 
-exit(cli.nominatim(osm2pgsql_path=None))
+exit(cli.nominatim())
diff --git a/settings/address-levels.json b/settings/address-levels.json
index b63eac4e..1b1ef7e7 100644
--- a/settings/address-levels.json
+++ b/settings/address-levels.json
@@ -23,8 +23,8 @@
           "allotments" : 22,
           "neighbourhood" : [20, 22],
           "quarter" : [20, 22],
-          "isolated_dwelling" : [22, 20],
-          "farm" : [22, 20],
+          "isolated_dwelling" : [22, 25],
+          "farm" : [22, 25],
           "city_block" : 25,
           "mountain_pass" : 25,
           "square" : 25,
@@ -74,6 +74,14 @@
           "stone" : 30,
           "" : [22, 0]
       },
+      "water" : {
+          "lake" : [20, 0],
+          "reservoir" : [20, 0],
+          "wastewater" : [24, 0],
+          "pond" : [24, 0],
+          "fountain" : [24, 0],
+          "" : [22, 0]
+      },
       "waterway" : {
           "river" : [19, 0],
           "stream" : [22, 0],
@@ -208,6 +216,14 @@
       }
   }
 },
+{ "countries" : ["sa"],
+  "tags" : {
+      "place" : {
+          "province" : 12,
+          "municipality" : 18
+      }
+  }
+},
 { "countries" : ["sk"],
   "tags" : {
       "boundary" : {
diff --git a/settings/country_settings.yaml b/settings/country_settings.yaml
index 667684c6..88ace911 100644
--- a/settings/country_settings.yaml
+++ b/settings/country_settings.yaml
@@ -944,7 +944,7 @@ kp:
 # South Korea (대한민국)
 kr:
     partition: 49
-    languages: ko, en
+    languages: ko
     names: !include country-names/kr.yaml
     postcode:
       pattern: "ddddd"
@@ -1809,7 +1809,8 @@ us:
     languages: en
     names: !include country-names/us.yaml
     postcode:
-      pattern: "ddddd"
+      pattern: "(ddddd)(?:-dddd)?"
+      output: \1
 
 
 # Uruguay (Uruguay)
diff --git a/settings/env.defaults b/settings/env.defaults
index b8c66667..3ebb288f 100644
--- a/settings/env.defaults
+++ b/settings/env.defaults
@@ -192,6 +192,13 @@ NOMINATIM_REQUEST_TIMEOUT=60
 # to geocode" instead.
 NOMINATIM_SEARCH_WITHIN_COUNTRIES=False
 
+# Specifies the order in which different name tags are used.
+# The values in this list determine the preferred order of name variants,
+# including language-specific names.
+# Comma-separated list, where :XX stands for language-specific tags
+# (e.g. name:en) and no :XX stands for general tags (e.g. name).
+NOMINATIM_OUTPUT_NAMES=name:XX,name,brand,official_name:XX,short_name:XX,official_name,short_name,ref
+
 ### Log settings
 #
 # The following options allow to enable logging of API requests.
diff --git a/settings/flex-base.lua b/settings/flex-base.lua
deleted file mode 100644
index 7860737f..00000000
--- a/settings/flex-base.lua
+++ /dev/null
@@ -1,557 +0,0 @@
--- Core functions for Nominatim import flex style.
---
-
-local module = {}
-
-local PRE_DELETE = nil
-local PRE_EXTRAS = nil
-local POST_DELETE = nil
-local MAIN_KEYS = nil
-local NAMES = nil
-local ADDRESS_TAGS = nil
-local SAVE_EXTRA_MAINS = false
-local POSTCODE_FALLBACK = true
-
--- tables required for taginfo
-module.TAGINFO_MAIN = {keys = {}, delete_tags = {}}
-module.TAGINFO_NAME_KEYS = {}
-module.TAGINFO_ADDRESS_KEYS = {}
-
-
--- The single place table.
-local place_table = osm2pgsql.define_table{
-    name = "place",
-    ids = { type = 'any', id_column = 'osm_id', type_column = 'osm_type' },
-    columns = {
-        { column = 'class', type = 'text', not_null = true },
-        { column = 'type', type = 'text', not_null = true },
-        { column = 'admin_level', type = 'smallint' },
-        { column = 'name', type = 'hstore' },
-        { column = 'address', type = 'hstore' },
-        { column = 'extratags', type = 'hstore' },
-        { column = 'geometry', type = 'geometry', projection = 'WGS84', not_null = true },
-    },
-    data_tablespace = os.getenv("NOMINATIM_TABLESPACE_PLACE_DATA"),
-    index_tablespace = os.getenv("NOMINATIM_TABLESPACE_PLACE_INDEX"),
-    indexes = {}
-}
-
------------- Geometry functions for relations ---------------------
-
-function module.relation_as_multipolygon(o)
-    return o:as_multipolygon()
-end
-
-function module.relation_as_multiline(o)
-    return o:as_multilinestring():line_merge()
-end
-
-
-module.RELATION_TYPES = {
-    multipolygon = module.relation_as_multipolygon,
-    boundary = module.relation_as_multipolygon,
-    waterway = module.relation_as_multiline
-}
-
-------------- Place class ------------------------------------------
-
-local Place = {}
-Place.__index = Place
-
-function Place.new(object, geom_func)
-    local self = setmetatable({}, Place)
-    self.object = object
-    self.geom_func = geom_func
-
-    self.admin_level = tonumber(self.object:grab_tag('admin_level'))
-    if self.admin_level == nil
-       or self.admin_level <= 0 or self.admin_level > 15
-       or math.floor(self.admin_level) ~= self.admin_level then
-        self.admin_level = 15
-    end
-
-    self.num_entries = 0
-    self.has_name = false
-    self.names = {}
-    self.address = {}
-    self.extratags = {}
-
-    return self
-end
-
-function Place:clean(data)
-    for k, v in pairs(self.object.tags) do
-        if data.delete ~= nil and data.delete(k, v) then
-            self.object.tags[k] = nil
-        elseif data.extra ~= nil and data.extra(k, v) then
-            self.extratags[k] = v
-            self.object.tags[k] = nil
-        end
-    end
-end
-
-function Place:delete(data)
-    if data.match ~= nil then
-        for k, v in pairs(self.object.tags) do
-            if data.match(k, v) then
-                self.object.tags[k] = nil
-            end
-        end
-    end
-end
-
-function Place:grab_extratags(data)
-    local count = 0
-
-    if data.match ~= nil then
-        for k, v in pairs(self.object.tags) do
-            if data.match(k, v) then
-                self.object.tags[k] = nil
-                self.extratags[k] = v
-                count = count + 1
-            end
-        end
-    end
-
-    return count
-end
-
-local function strip_address_prefix(k)
-    if k:sub(1, 5) == 'addr:' then
-        return k:sub(6)
-    end
-
-    if k:sub(1, 6) == 'is_in:' then
-        return k:sub(7)
-    end
-
-    return k
-end
-
-
-function Place:grab_address_parts(data)
-    local count = 0
-
-    if data.groups ~= nil then
-        for k, v in pairs(self.object.tags) do
-            local atype = data.groups(k, v)
-
-            if atype ~= nil then
-                if atype == 'main' then
-                    self.has_name = true
-                    self.address[strip_address_prefix(k)] = v
-                    count = count + 1
-                elseif atype == 'extra' then
-                    self.address[strip_address_prefix(k)] = v
-                else
-                    self.address[atype] = v
-                end
-                self.object.tags[k] = nil
-            end
-        end
-    end
-
-    return count
-end
-
-
-function Place:grab_name_parts(data)
-    local fallback = nil
-
-    if data.groups ~= nil then
-        for k, v in pairs(self.object.tags) do
-            local atype = data.groups(k, v)
-
-            if atype ~= nil then
-                self.names[k] = v
-                self.object.tags[k] = nil
-                if atype == 'main' then
-                    self.has_name = true
-                elseif atype == 'house' then
-                    self.has_name = true
-                    fallback = {'place', 'house', 'always'}
-                end
-            end
-        end
-    end
-
-    return fallback
-end
-
-
-function Place:write_place(k, v, mtype, save_extra_mains)
-    if mtype == nil then
-        return 0
-    end
-
-    v = v or self.object.tags[k]
-    if v == nil then
-        return 0
-    end
-
-    if type(mtype) == 'table' then
-        mtype = mtype[v] or mtype[1]
-    end
-
-    if mtype == 'always' or (self.has_name and mtype == 'named') then
-        return self:write_row(k, v, save_extra_mains)
-    end
-
-    if mtype == 'named_with_key' then
-        local names = {}
-        local prefix = k .. ':name'
-        for namek, namev in pairs(self.object.tags) do
-            if namek:sub(1, #prefix) == prefix
-               and (#namek == #prefix
-                    or namek:sub(#prefix + 1, #prefix + 1) == ':') then
-                names[namek:sub(#k + 2)] = namev
-            end
-        end
-
-        if next(names) ~= nil then
-            local saved_names = self.names
-            self.names = names
-
-            local results = self:write_row(k, v, save_extra_mains)
-
-            self.names = saved_names
-
-            return results
-        end
-    end
-
-    return 0
-end
-
-function Place:write_row(k, v, save_extra_mains)
-    if self.geometry == nil then
-        self.geometry = self.geom_func(self.object)
-    end
-    if self.geometry == nil or self.geometry:is_null() then
-        return 0
-    end
-
-    if save_extra_mains ~= nil then
-        for extra_k, extra_v in pairs(self.object.tags) do
-            if extra_k ~= k and save_extra_mains(extra_k, extra_v) then
-                self.extratags[extra_k] = extra_v
-            end
-        end
-    end
-
-    place_table:insert{
-        class = k,
-        type = v,
-        admin_level = self.admin_level,
-        name = next(self.names) and self.names,
-        address = next(self.address) and self.address,
-        extratags = next(self.extratags) and self.extratags,
-        geometry = self.geometry
-    }
-
-    if save_extra_mains then
-        for tk, tv in pairs(self.object.tags) do
-            if save_extra_mains(tk, tv) then
-                self.extratags[tk] = nil
-            end
-        end
-    end
-
-    self.num_entries = self.num_entries + 1
-
-    return 1
-end
-
-
-function module.tag_match(data)
-    if data == nil or next(data) == nil then
-        return nil
-    end
-
-    local fullmatches = {}
-    local key_prefixes = {}
-    local key_suffixes = {}
-
-    if data.keys ~= nil then
-        for _, key in pairs(data.keys) do
-            if key:sub(1, 1) == '*' then
-                if #key > 1 then
-                    if key_suffixes[#key - 1] == nil then
-                        key_suffixes[#key - 1] = {}
-                    end
-                    key_suffixes[#key - 1][key:sub(2)] = true
-                end
-            elseif key:sub(#key, #key) == '*' then
-                if key_prefixes[#key - 1] == nil then
-                    key_prefixes[#key - 1] = {}
-                end
-                key_prefixes[#key - 1][key:sub(1, #key - 1)] = true
-            else
-                fullmatches[key] = true
-            end
-        end
-    end
-
-    if data.tags ~= nil then
-        for k, vlist in pairs(data.tags) do
-            if fullmatches[k] == nil then
-                fullmatches[k] = {}
-                for _, v in pairs(vlist) do
-                    fullmatches[k][v] = true
-                end
-            end
-        end
-    end
-
-    return function (k, v)
-        if fullmatches[k] ~= nil and (fullmatches[k] == true or fullmatches[k][v] ~= nil) then
-            return true
-        end
-
-        for slen, slist in pairs(key_suffixes) do
-            if #k >= slen and slist[k:sub(-slen)] ~= nil then
-                return true
-            end
-        end
-
-        for slen, slist in pairs(key_prefixes) do
-            if #k >= slen and slist[k:sub(1, slen)] ~= nil then
-                return true
-            end
-        end
-
-        return false
-    end
-end
-
-
-function module.tag_group(data)
-    if data == nil or next(data) == nil then
-        return nil
-    end
-
-    local fullmatches = {}
-    local key_prefixes = {}
-    local key_suffixes = {}
-
-    for group, tags in pairs(data) do
-        for _, key in pairs(tags) do
-            if key:sub(1, 1) == '*' then
-                if #key > 1 then
-                    if key_suffixes[#key - 1] == nil then
-                        key_suffixes[#key - 1] = {}
-                    end
-                    key_suffixes[#key - 1][key:sub(2)] = group
-                end
-            elseif key:sub(#key, #key) == '*' then
-                if key_prefixes[#key - 1] == nil then
-                    key_prefixes[#key - 1] = {}
-                end
-                key_prefixes[#key - 1][key:sub(1, #key - 1)] = group
-            else
-                fullmatches[key] = group
-            end
-        end
-    end
-
-    return function (k, v)
-        local val = fullmatches[k]
-        if val ~= nil then
-            return val
-        end
-
-        for slen, slist in pairs(key_suffixes) do
-            if #k >= slen then
-                val = slist[k:sub(-slen)]
-                if val ~= nil then
-                    return val
-                end
-            end
-        end
-
-        for slen, slist in pairs(key_prefixes) do
-            if #k >= slen then
-                val = slist[k:sub(1, slen)]
-                if val ~= nil then
-                    return val
-                end
-            end
-        end
-    end
-end
-
--- Returns prefix part of the keys, and reject suffix matching keys
-local function process_key(key)
-    if key:sub(1, 1) == '*' then
-        return nil
-    end
-    if key:sub(#key, #key) == '*' then
-        return key:sub(1, #key - 2)
-    end
-    return key
-end
-
--- Process functions for all data types
-function module.process_node(object)
-
-    local function geom_func(o)
-        return o:as_point()
-    end
-
-    module.process_tags(Place.new(object, geom_func))
-end
-
-function module.process_way(object)
-
-    local function geom_func(o)
-        local geom = o:as_polygon()
-
-        if geom:is_null() then
-            geom = o:as_linestring()
-            if not geom:is_null() and geom:length() > 30 then
-              return nil
-            end
-        end
-
-        return geom
-    end
-
-    module.process_tags(Place.new(object, geom_func))
-end
-
-function module.process_relation(object)
-    local geom_func = module.RELATION_TYPES[object.tags.type]
-
-    if geom_func ~= nil then
-        module.process_tags(Place.new(object, geom_func))
-    end
-end
-
--- The process functions are used by default by osm2pgsql.
-osm2pgsql.process_node = module.process_node
-osm2pgsql.process_way = module.process_way
-osm2pgsql.process_relation = module.process_relation
-
-function module.process_tags(o)
-    o:clean{delete = PRE_DELETE, extra = PRE_EXTRAS}
-
-    -- Exception for boundary/place double tagging
-    if o.object.tags.boundary == 'administrative' then
-        o:grab_extratags{match = function (k, v)
-            return k == 'place' and v:sub(1,3) ~= 'isl'
-        end}
-    end
-
-    -- name keys
-    local fallback = o:grab_name_parts{groups=NAMES}
-
-    -- address keys
-    if o:grab_address_parts{groups=ADDRESS_TAGS} > 0 and fallback == nil then
-        fallback = {'place', 'house', 'always'}
-    end
-    if o.address.country ~= nil and #o.address.country ~= 2 then
-        o.address['country'] = nil
-    end
-    if POSTCODE_FALLBACK and fallback == nil and o.address.postcode ~= nil then
-        fallback = {'place', 'postcode', 'always'}
-    end
-
-    if o.address.interpolation ~= nil then
-        o:write_place('place', 'houses', 'always', SAVE_EXTRA_MAINS)
-        return
-    end
-
-    o:clean{delete = POST_DELETE}
-
-    -- collect main keys
-    for k, v in pairs(o.object.tags) do
-        local ktype = MAIN_KEYS[k]
-        if ktype == 'fallback' then
-            if o.has_name then
-                fallback = {k, v, 'named'}
-            end
-        elseif ktype ~= nil then
-            o:write_place(k, v, MAIN_KEYS[k], SAVE_EXTRA_MAINS)
-        end
-    end
-
-    if fallback ~= nil and o.num_entries == 0 then
-        o:write_place(fallback[1], fallback[2], fallback[3], SAVE_EXTRA_MAINS)
-    end
-end
-
---------- Convenience functions for simple style configuration -----------------
-
-
-function module.set_prefilters(data)
-    PRE_DELETE = module.tag_match{keys = data.delete_keys, tags = data.delete_tags}
-    PRE_EXTRAS = module.tag_match{keys = data.extra_keys,
-                                  tags = data.extra_tags}
-    module.TAGINFO_MAIN.delete_tags = data.delete_tags
-end
-
-function module.set_main_tags(data)
-    MAIN_KEYS = data
-    local keys = {}
-    for k, _ in pairs(data) do
-        table.insert(keys, k)
-    end
-    module.TAGINFO_MAIN.keys = keys
-end
-
-function module.set_name_tags(data)
-    NAMES = module.tag_group(data)
-
-    for _, lst in pairs(data) do
-        for _, k in ipairs(lst) do
-            local key = process_key(k)
-            if key ~= nil then
-                module.TAGINFO_NAME_KEYS[key] = true
-            end
-        end
-    end
-end
-
-function module.set_address_tags(data)
-    if data.postcode_fallback ~= nil then
-        POSTCODE_FALLBACK = data.postcode_fallback
-        data.postcode_fallback = nil
-    end
-    ADDRESS_TAGS = module.tag_group(data)
-
-    for _, lst in pairs(data) do
-        if lst ~= nil then
-            for _, k in ipairs(lst) do
-                local key = process_key(k)
-                if key ~= nil then
-                    module.TAGINFO_ADDRESS_KEYS[key] = true
-                end
-            end
-        end
-    end
-end
-
-function module.set_unused_handling(data)
-    if data.extra_keys == nil and data.extra_tags == nil then
-        POST_DELETE = module.tag_match{keys = data.delete_keys, tags = data.delete_tags}
-        SAVE_EXTRA_MAINS = function() return true end
-    elseif data.delete_keys == nil and data.delete_tags == nil then
-        POST_DELETE = nil
-        SAVE_EXTRA_MAINS = module.tag_match{keys = data.extra_keys, tags = data.extra_tags}
-    else
-        error("unused handler can have only 'extra_keys' or 'delete_keys' set.")
-    end
-end
-
-function module.set_relation_types(data)
-    module.RELATION_TYPES = {}
-    for k, v in data do
-        if v == 'multipolygon' then
-            module.RELATION_TYPES[k] = module.relation_as_multipolygon
-        elseif v == 'multiline' then
-            module.RELATION_TYPES[k] = module.relation_as_multiline
-        end
-    end
-end
-
-return module
diff --git a/settings/icu-rules/variants-ca.yaml b/settings/icu-rules/variants-ca.yaml
index fab36dec..943ead51 100644
--- a/settings/icu-rules/variants-ca.yaml
+++ b/settings/icu-rules/variants-ca.yaml
@@ -4,7 +4,7 @@
     -  aparcament -> aparc
     -  apartament -> apmt
     -  apartat -> apt
-    - àtic -> àt
+    -  àtic -> àt
     -  autopista -> auto
     -  autopista -> autop
     -  autovia -> autov
@@ -19,7 +19,6 @@
     -  biblioteca -> bibl
     -  bloc -> bl
     -  carrer -> c
-    -  carrer -> c/
     -  carreró -> cró
     -  carretera -> ctra
     -  cantonada -> cant
@@ -58,7 +57,6 @@
     -  número -> n
     -  sense número -> s/n
     -  parada -> par
-    -  parcel·la -> parc
     -  passadís -> pdís
     -  passatge -> ptge
     -  passeig -> pg
diff --git a/settings/icu-rules/variants-en.yaml b/settings/icu-rules/variants-en.yaml
index 5508fcd1..54a7b475 100644
--- a/settings/icu-rules/variants-en.yaml
+++ b/settings/icu-rules/variants-en.yaml
@@ -1,438 +1,393 @@
 # Source: https://wiki.openstreetmap.org/wiki/Name_finder:Abbreviations#English
+# Source: https://pe.usps.com/text/pub28/28apc_002.htm
 - lang: en
   words:
     -  Access -> Accs
     -  Air Force Base -> AFB
     -  Air National Guard Base -> ANGB
     -  Airport -> Aprt
-    -  Alley -> Al
-    -  Alley -> All
-    -  Alley -> Ally
-    -  Alley -> Aly
+    -  Alley -> Al,All,Ally,Aly
     -  Alleyway -> Alwy
     -  Amble -> Ambl
+    -  Anex -> Anx
     -  Apartments -> Apts
-    -  Approach -> Apch
-    -  Approach -> App
+    -  Approach -> Apch,App
     -  Arcade -> Arc
     -  Arterial -> Artl
     -  Artery -> Arty
-    -  Avenue -> Av
-    -  Avenue -> Ave
+    -  Avenue -> Av,Ave
     -  Back -> Bk
     -  Banan -> Ba
-    -  Basin -> Basn
-    -  Basin -> Bsn
+    -  Basin -> Basn,Bsn
+    -  Bayou -> Byu
     -  Beach -> Bch
-    -  Bend -> Bend
     -  Bend -> Bnd
     -  Block -> Blk
+    -  Bluff -> Blf
+    -  Bluffs -> Blfs
     -  Boardwalk -> Bwlk
-    -  Boulevard -> Blvd
-    -  Boulevard -> Bvd
+    -  Bottom -> Btm
+    -  Boulevard -> Blvd,Bvd
     -  Boundary -> Bdy
     -  Bowl -> Bl
     -  Brace -> Br
     -  Brae -> Br
-    -  Brae -> Brae
+    -  Branch -> Br
     -  Break -> Brk
-    -  Bridge -> Bdge
-    -  Bridge -> Br
-    -  Bridge -> Brdg
-    -  Bridge -> Bri
-    -  Broadway -> Bdwy
-    -  Broadway -> Bway
-    -  Broadway -> Bwy
+    -  Bridge$ -> Bdge,Br,Brdg,Brg,Bri
+    -  Broadway -> Bdwy,Bway,Bwy
     -  Brook -> Brk
+    -  Brooks -> Brks
     -  Brow -> Brw
-    -  Brow -> Brow
-    -  Buildings -> Bldgs
-    -  Buildings -> Bldngs
+    -  Buildings -> Bldgs,Bldngs
     -  Business -> Bus
-    -  Bypass -> Bps
-    -  Bypass -> Byp
-    -  Bypass -> Bypa
+    -  Burg -> Bg
+    -  Burgs -> Bgs
+    -  Bypass -> Bps,Byp,Bypa
     -  Byway -> Bywy
+    -  Camp -> Cp
+    -  Canyon -> Cyn
+    -  Cape -> Cpe
     -  Caravan -> Cvn
-    -  Causeway -> Caus
-    -  Causeway -> Cswy
-    -  Causeway -> Cway
-    -  Center -> Cen
-    -  Center -> Ctr
+    -  Causeway -> Caus,Cswy,Cway
+    -  Center,Centre -> Cen,Ctr
+    -  Centers -> Ctrs
     -  Central -> Ctrl
-    -  Centre -> Cen
-    -  Centre -> Ctr
     -  Centreway -> Cnwy
     -  Chase -> Ch
     -  Church -> Ch
     -  Circle -> Cir
-    -  Circuit -> Cct
-    -  Circuit -> Ci
-    -  Circus -> Crc
-    -  Circus -> Crcs
+    -  Circles -> Cirs
+    -  Circuit -> Cct,Ci
+    -  Circus -> Crc,Crcs
     -  City -> Cty
+    -  Cliff -> Clf
+    -  Cliffs -> Clfs
     -  Close -> Cl
-    -  Common -> Cmn
-    -  Common -> Comm
+    -  Club -> Clb
+    -  Common -> Cmn,Comm
+    -  Commons -> Cmns
     -  Community -> Comm
     -  Concourse -> Cnc
     -  Concourse -> Con
     -  Copse -> Cps
-    -  Corner -> Cnr
-    -  Corner -> Crn
+    -  Corner -> Cor,Cnr,Crn
+    -  Corners -> Cors
     -  Corso -> Cso
     -  Cottages -> Cotts
     -  County -> Co
     -  County Road -> CR
     -  County Route -> CR
-    -  Court -> Crt
-    -  Court -> Ct
+    -  Course -> Crse
+    -  Court -> Crt,Ct
+    -  Courts -> Cts
     -  Courtyard -> Cyd
     -  Courtyard -> Ctyd
-    -  Cove -> Ce
-    -  Cove -> Cov
-    -  Cove -> Cove
-    -  Cove -> Cv
-    -  Creek -> Ck
-    -  Creek -> Cr
-    -  Creek -> Crk
+    -  Cove$ -> Ce,Cov,Cv
+    -  Coves -> Cvs
+    -  Creek$ -> Ck,Cr,Crk
     -  Crescent -> Cr
     -  Crescent -> Cres
-    -  Crest -> Crst
-    -  Crest -> Cst
+    -  Crest -> Crst,Cst
     -  Croft -> Cft
-    -  Cross -> Cs
-    -  Cross -> Crss
-    -  Crossing -> Crsg
-    -  Crossing -> Csg
-    -  Crossing -> Xing
-    -  Crossroad -> Crd
+    -  Cross -> Cs,Crss
+    -  Crossing -> Crsg,Csg,Xing
+    -  Crossroad -> Crd,Xrd
+    -  Crossroads -> Xrds
     -  Crossway -> Cowy
-    -  Cul-de-sac -> Cds
-    -  Cul-de-sac -> Csac
-    -  Curve -> Cve
+    -  Cul-de-sac -> Cds,Csac
+    -  Curve -> Cve,Curv
     -  Cutting -> Cutt
     -  Dale -> Dle
-    -  Dale -> Dale
+    -  Dam -> Dm
     -  Deviation -> Devn
-    -  Dip -> Dip
     -  Distributor -> Dstr
+    -  Divide -> Dv
     -  Down -> Dn
     -  Downs -> Dn
-    -  Drive -> Dr
-    -  Drive -> Drv
-    -  Drive -> Dv
+    -  Drive -> Dr,Drv,Dv
+    -  Drives -> Drs
     -  Drive-In => Drive-In # prevent abbreviation here
-    -  Driveway -> Drwy
-    -  Driveway -> Dvwy
-    -  Driveway -> Dwy
+    -  Driveway -> Drwy,Dvwy,Dwy
     -  East -> E
     -  Edge -> Edg
-    -  Edge -> Edge
     -  Elbow -> Elb
-    -  End -> End
     -  Entrance -> Ent
     -  Esplanade -> Esp
     -  Estate -> Est
-    -  Expressway -> Exp
-    -  Expressway -> Expy
-    -  Expressway -> Expwy
-    -  Expressway -> Xway
+    -  Estates -> Ests
+    -  Expressway -> Exp,Expy,Expwy,Xway
     -  Extension -> Ex
-    -  Fairway -> Fawy
-    -  Fairway -> Fy
+    -  Extensions -> Exts
+    -  Fairway -> Fawy,Fy
+    -  Falls -> Fls
     -  Father -> Fr
-    -  Ferry -> Fy
-    -  Field -> Fd
+    -  Ferry -> Fy,Fry
+    -  Field -> Fd,Fld
+    -  Fields -> Flds
     -  Fire Track -> Ftrk
     -  Firetrail -> Fit
-    -  Flat -> Fl
-    -  Flat -> Flat
+    -  Flat -> Fl,Flt
+    -  Flats -> Flts
     -  Follow -> Folw
     -  Footway -> Ftwy
+    -  Ford -> Frd
+    -  Fords -> Frds
     -  Foreshore -> Fshr
+    -  Forest -> Frst
     -  Forest Service Road -> FSR
+    -  Forge -> Frg
+    -  Forges -> Frgs
     -  Formation -> Form
+    -  Fork -> Frk
+    -  Forks -> Frks
     -  Fort -> Ft
-    -  Freeway -> Frwy
-    -  Freeway -> Fwy
+    -  Freeway -> Frwy,Fwy
     -  Front -> Frnt
-    -  Frontage -> Fr
-    -  Frontage -> Frtg
-    -  Gap -> Gap
+    -  Frontage -> Fr,Frtg
     -  Garden -> Gdn
-    -  Gardens -> Gdn
-    -  Gardens -> Gdns
-    -  Gate -> Ga
-    -  Gate -> Gte
-    -  Gates -> Ga
-    -  Gates -> Gte
-    -  Gateway -> Gwy
+    -  Gardens -> Gdn,Gdns
+    -  Gate,Gates -> Ga,Gte
+    -  Gateway -> Gwy,Gtwy
     -  George -> Geo
-    -  Glade -> Gl
-    -  Glade -> Gld
-    -  Glade -> Glde
+    -  Glade$ -> Gl,Gld,Glde
     -  Glen -> Gln
-    -  Glen -> Glen
+    -  Glens -> Glns
     -  Grange -> Gra
-    -  Green -> Gn
-    -  Green -> Grn
+    -  Green -> Gn,Grn
+    -  Greens -> Grns
     -  Ground -> Grnd
-    -  Grove -> Gr
-    -  Grove -> Gro
+    -  Grove$ -> Gr,Gro,Grv
+    -  Groves -> Grvs
     -  Grovet -> Gr
     -  Gully -> Gly
-    -  Harbor -> Hbr
-    -  Harbour -> Hbr
+    -  Harbor -> Hbr,Harbour
+    -  Harbors -> Hbrs
+    -  Harbour -> Hbr,Harbor
     -  Haven -> Hvn
     -  Head -> Hd
     -  Heads -> Hd
-    -  Heights -> Hgts
-    -  Heights -> Ht
-    -  Heights -> Hts
+    -  Heights -> Hgts,Ht,Hts
     -  High School -> HS
-    -  Highroad -> Hird
-    -  Highroad -> Hrd
+    -  Highroad -> Hird,Hrd
     -  Highway -> Hwy
-    -  Hill -> Hill
     -  Hill -> Hl
-    -  Hills -> Hl
-    -  Hills -> Hls
+    -  Hills -> Hl,Hls
+    -  Hollow -> Holw
     -  Hospital -> Hosp
-    -  House -> Ho
-    -  House -> Hse
+    -  House -> Ho,Hse
     -  Industrial -> Ind
+    -  Inlet -> Inlt
     -  Interchange -> Intg
     -  International -> Intl
-    -  Island -> I
-    -  Island -> Is
-    -  Junction -> Jctn
-    -  Junction -> Jnc
+    -  Island -> I,Is
+    -  Islands -> Iss
+    -  Junction -> Jct,Jctn,Jnc
+    -  Junctions -> Jcts
     -  Junior -> Jr
-    -  Key -> Key
+    -  Key -> Ky
+    -  Keys -> Kys
+    -  Knoll -> Knl
+    -  Knolls -> Knls
     -  Lagoon -> Lgn
-    -  Lakes -> L
-    -  Landing -> Ldg
-    -  Lane -> La
-    -  Lane -> Lane
-    -  Lane -> Ln
+    -  Lake -> Lk
+    -  Lakes -> L,Lks
+    -  Landing -> Ldg,Lndg
+    -  Lane -> La,Ln
     -  Laneway -> Lnwy
-    -  Line -> Line
+    -  Light -> Lgt
+    -  Lights -> Lgts
     -  Line -> Ln
-    -  Link -> Link
     -  Link -> Lk
-    -  Little -> Lit
-    -  Little -> Lt
+    -  Little -> Lit,Lt
+    -  Loaf -> Lf
+    -  Lock -> Lck
+    -  Locks -> Lcks
     -  Lodge -> Ldg
     -  Lookout -> Lkt
-    -  Loop -> Loop
     -  Loop -> Lp
-    -  Lower -> Low
-    -  Lower -> Lr
-    -  Lower -> Lwr
-    -  Mall -> Mall
+    -  Lower -> Low,Lr,Lwr
     -  Mall -> Ml
     -  Manor -> Mnr
+    -  Manors -> Mnrs
     -  Mansions -> Mans
     -  Market -> Mkt
     -  Meadow -> Mdw
-    -  Meadows -> Mdw
-    -  Meadows -> Mdws
+    -  Meadows -> Mdw,Mdws
     -  Mead -> Md
-    -  Meander -> Mdr
-    -  Meander -> Mndr
-    -  Meander -> Mr
+    -  Meander -> Mdr,Mndr,Mr
     -  Medical -> Med
     -  Memorial -> Mem
-    -  Mews -> Mews
     -  Mews -> Mw
     -  Middle -> Mid
     -  Middle School -> MS
     -  Mile -> Mi
     -  Military -> Mil
-    -  Motorway -> Mtwy
-    -  Motorway -> Mwy
+    -  Mill -> Ml
+    -  Mills -> Mls
+    -  Mission -> Msn
+    -  Motorway -> Mtwy,Mwy
     -  Mount -> Mt
     -  Mountain -> Mtn
-    -  Mountains -> Mtn
+    -  Mountains$ -> Mtn,Mtns
     -  Municipal -> Mun
     -  Museum -> Mus
     -  National Park -> NP
     -  National Recreation Area -> NRA
     -  National Wildlife Refuge Area -> NWRA
+    -  Neck -> Nck
     -  Nook -> Nk
-    -  Nook -> Nook
     -  North -> N
     -  Northeast -> NE
     -  Northwest -> NW
-    -  Outlook -> Out
-    -  Outlook -> Otlk
+    -  Orchard -> Orch
+    -  Outlook -> Out,Otlk
+    -  Overpass -> Opas
     -  Parade -> Pde
     -  Paradise -> Pdse
-    -  Park -> Park
     -  Park -> Pk
     -  Parklands -> Pkld
-    -  Parkway -> Pkwy
-    -  Parkway -> Pky
-    -  Parkway -> Pwy
-    -  Pass -> Pass
+    -  Parkway -> Pkwy,Pky,Pwy
+    -  Parkways -> Pkwy
     -  Pass -> Ps
     -  Passage -> Psge
-    -  Path -> Path
-    -  Pathway -> Phwy
-    -  Pathway -> Pway
-    -  Pathway -> Pwy
+    -  Pathway -> Phwy,Pway,Pwy
     -  Piazza -> Piaz
     -  Pike -> Pk
+    -  Pine -> Pne
+    -  Pines -> Pnes
     -  Place -> Pl
-    -  Plain -> Pl
-    -  Plains -> Pl
+    -  Plain -> Pl,Pln
+    -  Plains -> Pl,Plns
     -  Plateau -> Plat
-    -  Plaza -> Pl
-    -  Plaza -> Plz
-    -  Plaza -> Plza
+    -  Plaza -> Pl,Plz,Plza
     -  Pocket -> Pkt
-    -  Point -> Pnt
-    -  Point -> Pt
-    -  Port -> Port
-    -  Port -> Pt
+    -  Point -> Pnt,Pt
+    -  Points -> Pts
+    -  Port -> Prt,Pt
+    -  Ports -> Prts
     -  Post Office -> PO
+    -  Prairie -> Pr
     -  Precinct -> Pct
-    -  Promenade -> Prm
-    -  Promenade -> Prom
-    -  Quad -> Quad
+    -  Promenade -> Prm,Prom
     -  Quadrangle -> Qdgl
-    -  Quadrant -> Qdrt
-    -  Quadrant -> Qd
+    -  Quadrant -> Qdrt,Qd
     -  Quay -> Qy
     -  Quays -> Qy
     -  Quays -> Qys
+    -  Radial -> Radl
     -  Ramble -> Ra
     -  Ramble -> Rmbl
-    -  Range -> Rge
-    -  Range -> Rnge
+    -  Ranch -> Rnch
+    -  Range -> Rge,Rnge
+    -  Rapid -> Rpd
+    -  Rapids -> Rpds
     -  Reach -> Rch
     -  Reservation -> Res
     -  Reserve -> Res
     -  Reservoir -> Res
-    -  Rest -> Rest
     -  Rest -> Rst
-    -  Retreat -> Rt
-    -  Retreat -> Rtt
+    -  Retreat -> Rt,Rtt
     -  Return -> Rtn
-    -  Ridge -> Rdg
-    -  Ridge -> Rdge
+    -  Ridge -> Rdg,Rdge
+    -  Ridges -> Rdgs
     -  Ridgeway -> Rgwy
     -  Right of Way -> Rowy
     -  Rise -> Ri
-    -  Rise -> Rise
-    -  River -> R
-    -  River -> Riv
-    -  River -> Rvr
+    -  ^River -> R,Riv,Rvr
+    -  River$ -> R,Riv,Rvr
     -  Riverway -> Rvwy
     -  Riviera -> Rvra
     -  Road -> Rd
     -  Roads -> Rds
     -  Roadside -> Rdsd
-    -  Roadway -> Rdwy
-    -  Roadway -> Rdy
-    -  Robert -> Robt
+    -  Roadway -> Rdwy,Rdy
     -  Rocks -> Rks
     -  Ronde -> Rnde
     -  Rosebowl -> Rsbl
     -  Rotary -> Rty
     -  Round -> Rnd
-    -  Route -> Rt
-    -  Route -> Rte
-    -  Row -> Row
-    -  Rue -> Rue
-    -  Run -> Run
+    -  Route -> Rt,Rte
     -  Saint -> St
     -  Saints -> SS
     -  Senior -> Sr
-    -  Serviceway -> Swy
-    -  Serviceway -> Svwy
+    -  Serviceway -> Swy,Svwy
+    -  Shoal -> Shl
+    -  Shore -> Shr
+    -  Shores -> Shrs
     -  Shunt -> Shun
     -  Siding -> Sdng
     -  Sister -> Sr
+    -  Skyway -> Skwy
     -  Slope -> Slpe
     -  Sound -> Snd
-    -  South -> S
-    -  South -> Sth
+    -  South -> S,Sth
     -  Southeast -> SE
     -  Southwest -> SW
-    -  Spur -> Spur
+    -  Spring -> Spg
+    -  Springs -> Spgs
+    -  Spurs -> Spur
     -  Square -> Sq
+    -  Squares -> Sqs
     -  Stairway -> Strwy
-    -  State Highway -> SH
-    -  State Highway -> SHwy
+    -  State Highway -> SH,SHwy
     -  State Route -> SR
-    -  Station -> Sta
-    -  Station -> Stn
-    -  Strand -> Sd
-    -  Strand -> Stra
+    -  Station -> Sta,Stn
+    -  Strand -> Sd,Stra
+    -  Stravenue -> Stra
+    -  Stream -> Strm
     -  Street -> St
+    -  Streets -> Sts
     -  Strip -> Strp
     -  Subway -> Sbwy
+    -  Summit -> Smt
     -  Tarn -> Tn
-    -  Tarn -> Tarn
     -  Terminal -> Term
-    -  Terrace -> Tce
-    -  Terrace -> Ter
-    -  Terrace -> Terr
-    -  Thoroughfare -> Thfr
-    -  Thoroughfare -> Thor
-    -  Tollway -> Tlwy
-    -  Tollway -> Twy
-    -  Top -> Top
-    -  Tor -> Tor
+    -  Terrace -> Tce,Ter,Terr
+    -  Thoroughfare -> Thfr,Thor
+    -  Throughway -> Trwy
+    -  Tollway -> Tlwy,Twy
     -  Towers -> Twrs
     -  Township -> Twp
     -  Trace -> Trce
-    -  Track -> Tr
-    -  Track -> Trk
+    -  Track -> Tr,Trak,Trk
+    -  Trafficway -> Trfy
     -  Trail -> Trl
     -  Trailer -> Trlr
     -  Triangle -> Tri
     -  Trunkway -> Tkwy
-    -  Tunnel -> Tun
-    -  Turn -> Tn
-    -  Turn -> Trn
-    -  Turn -> Turn
-    -  Turnpike -> Tpk
-    -  Turnpike -> Tpke
-    -  Underpass -> Upas
-    -  Underpass -> Ups
-    -  University -> Uni
-    -  University -> Univ
+    -  Tunnel -> Tun,Tunl
+    -  Turn -> Tn,Trn
+    -  Turnpike -> Tpk,Tpke
+    -  Underpass -> Upas,Ups
+    -  Union -> Un
+    -  Unions -> Uns
+    -  University -> Uni,Univ
     -  Upper -> Up
     -  Upper -> Upr
     -  Vale -> Va
-    -  Vale -> Vale
+    -  Valley -> Vly
     -  Valley -> Vy
-    -  Viaduct -> Vdct
-    -  Viaduct -> Via
-    -  Viaduct -> Viad
+    -  Valleys -> Vlys
+    -  Viaduct$ -> Vdct,Via,Viad
     -  View -> Vw
-    -  View -> View
-    -  Village -> Vill
+    -  Views -> Vws
+    -  Village -> Vill,Vlg
+    -  Villages -> Vlgs
     -  Villas -> Vlls
-    -  Vista -> Vst
-    -  Vista -> Vsta
-    -  Walk -> Walk
-    -  Walk -> Wk
-    -  Walk -> Wlk
-    -  Walkway -> Wkwy
-    -  Walkway -> Wky
+    -  Ville -> Vl
+    -  Vista -> Vis,Vst,Vsta
+    -  Walk -> Wk,Wlk
+    -  Walks -> Walk
+    -  Walkway -> Wkwy,Wky
     -  Waters -> Wtr
-    -  Way -> Way
     -  Way -> Wy
+    -  Well -> Wl
+    -  Wells -> Wls
     -  West -> W
     -  Wharf -> Whrf
     -  William -> Wm
     -  Wynd -> Wyn
-    -  Wynd -> Wynd
-    -  Yard -> Yard
     -  Yard -> Yd
 - lang: en
   country: ca
diff --git a/settings/icu-rules/variants-es.yaml b/settings/icu-rules/variants-es.yaml
index 5c5e6abe..fbe40b54 100644
--- a/settings/icu-rules/variants-es.yaml
+++ b/settings/icu-rules/variants-es.yaml
@@ -30,7 +30,6 @@
     -  Bloque -> Blq
     -  Bulevar -> Blvr
     -  Boulevard -> Blvd
-    -  Calle -> C/
     -  Calle -> C
     -  Calle -> Cl
     -  Calleja -> Cllja
diff --git a/settings/icu-rules/variants-fr.yaml b/settings/icu-rules/variants-fr.yaml
index 0fd9c337..b9cfc493 100644
--- a/settings/icu-rules/variants-fr.yaml
+++ b/settings/icu-rules/variants-fr.yaml
@@ -3,20 +3,16 @@
   words:
     -  Abbaye -> ABE
     -  AgglomÃ©ration -> AGL
-    -  Aire -> AIRE
     -  Aires -> AIRE
     -  AllÃ©e -> ALL
-    -  AllÃ©e -> All
     -  AllÃ©es -> ALL
     -  Ancien chemin -> ACH
     -  Ancienne route -> ART
     -  Anciennes routes -> ART
-    -  Anse -> ANSE
     -  Arcade -> ARC
     -  Arcades -> ARC
     -  Autoroute -> AUT
     -  Avenue -> AV
-    -  Avenue -> Av
     -  BarriÃ¨re -> BRE
     -  BarriÃ¨res -> BRE
     -  Bas chemin -> BCH
@@ -28,16 +24,11 @@
     -  Berges -> BER
     -  Bois -> BOIS
     -  Boucle -> BCLE
-    -  Boulevard -> Bd
     -  Boulevard -> BD
     -  Bourg -> BRG
     -  Butte -> BUT
-    -  CitÃ© -> CITE
     -  CitÃ©s -> CITE
-    -  CÃ´te -> COTE
     -  CÃ´teau -> COTE
-    -  Cale -> CALE
-    -  Camp -> CAMP
     -  Campagne -> CGNE
     -  Camping -> CPG
     -  Carreau -> CAU
@@ -56,17 +47,13 @@
     -  ChaussÃ©es -> CHS
     -  Chemin -> Ch
     -  Chemin -> CHE
-    -  Chemin -> Che
     -  Chemin vicinal -> CHV
     -  Cheminement -> CHEM
     -  Cheminements -> CHEM
     -  Chemins -> CHE
     -  Chemins vicinaux -> CHV
-    -  Chez -> CHEZ
     -  ChÃ¢teau -> CHT
     -  CloÃ®tre -> CLOI
-    -  Clos -> CLOS
-    -  Col -> COL
     -  Colline -> COLI
     -  Collines -> COLI
     -  Contour -> CTR
@@ -74,9 +61,7 @@
     -  Corniches -> COR
     -  Cottage -> COTT
     -  Cottages -> COTT
-    -  Cour -> COUR
     -  Cours -> CRS
-    -  Cours -> Crs
     -  Darse -> DARS
     -  DegrÃ© -> DEG
     -  DegrÃ©s -> DEG
@@ -87,11 +72,8 @@
     -  Domaine -> DOM
     -  Domaines -> DOM
     -  Ãcluse -> ECL
-    -  Ãcluse -> ÃCL
     -  Ãcluses -> ECL
-    -  Ãcluses -> ÃCL
     -  Ãglise -> EGL
-    -  Ãglise -> ÃGL
     -  Enceinte -> EN
     -  Enclave -> ENV
     -  Enclos -> ENC
@@ -100,21 +82,16 @@
     -  Espace -> ESPA
     -  Esplanade -> ESP
     -  Esplanades -> ESP
-    -  Ãtang -> ETANG
-    -  Ãtang -> ÃTANG
     -  Faubourg -> FG
-    -  Faubourg -> Fg
     -  Ferme -> FRM
     -  Fermes -> FRM
     -  Fontaine -> FON
-    -  Fort -> FORT
     -  Forum -> FORM
     -  Fosse -> FOS
     -  Fosses -> FOS
     -  Foyer -> FOYR
     -  Galerie -> GAL
     -  Galeries -> GAL
-    -  Gare -> GARE
     -  Garenne -> GARN
     -  Grand boulevard -> GBD
     -  Grand ensemble -> GDEN
@@ -134,13 +111,9 @@
     -  Haut chemin -> HCH
     -  Hauts chemins -> HCH
     -  Hippodrome -> HIP
-    -  HLM -> HLM
-    -  Ãle -> ILE
-    -  Ãle -> ÃLE
     -  Immeuble -> IMM
     -  Immeubles -> IMM
     -  Impasse -> IMP
-    -  Impasse -> Imp
     -  Impasses -> IMP
     -  Jardin -> JARD
     -  Jardins -> JARD
@@ -150,13 +123,11 @@
     -  Lieu-dit -> LD
     -  Lotissement -> LOT
     -  Lotissements -> LOT
-    -  Mail -> MAIL
     -  Maison forestiÃ¨re -> MF
     -  Manoir -> MAN
     -  Marche -> MAR
     -  Marches -> MAR
     -  MarÃ©chal -> MAL
-    -  Mas -> MAS
     -  Monseigneur -> Mgr
     -  Mont -> Mt
     -  MontÃ©e -> MTE
@@ -168,13 +139,9 @@
     -  MÃ©tro -> MÃT
     -  Nouvelle route -> NTE
     -  Palais -> PAL
-    -  Parc -> PARC
-    -  Parcs -> PARC
     -  Parking -> PKG
     -  Parvis -> PRV
     -  Passage -> PAS
-    -  Passage -> Pas
-    -  Passage -> Pass
     -  Passage Ã  niveau -> PN
     -  Passe -> PASS
     -  Passerelle -> PLE
@@ -191,19 +158,14 @@
     -  Petite rue -> PTR
     -  Petites allÃ©es -> PTA
     -  Place -> PL
-    -  Place -> Pl
     -  Placis -> PLCI
     -  Plage -> PLAG
     -  Plages -> PLAG
     -  Plaine -> PLN
-    -  Plan -> PLAN
     -  Plateau -> PLT
     -  Plateaux -> PLT
     -  Pointe -> PNT
-    -  Pont -> PONT
-    -  Ponts -> PONT
     -  Porche -> PCH
-    -  Port -> PORT
     -  Porte -> PTE
     -  Portique -> PORQ
     -  Portiques -> PORQ
@@ -211,25 +173,19 @@
     -  Pourtour -> POUR
     -  PresquâÃ®le -> PRQ
     -  Promenade -> PROM
-    -  Promenade -> Prom
-    -  PrÃ© -> PRE
-    -  PrÃ© -> PRÃ
     -  PÃ©riphÃ©rique -> PERI
     -  PÃ©ristyle -> PSTY
     -  Quai -> QU
-    -  Quai -> Qu
     -  Quartier -> QUA
     -  Raccourci -> RAC
     -  Raidillon -> RAID
     -  Rampe -> RPE
     -  Rempart -> REM
-    -  Roc -> ROC
     -  Rocade -> ROC
     -  Rond point -> RPT
     -  Roquet -> ROQT
     -  Rotonde -> RTD
     -  Route -> RTE
-    -  Route -> Rte
     -  Routes -> RTE
     -  Rue -> R
     -  Rue -> R
@@ -245,7 +201,6 @@
     -  Sentier -> SEN
     -  Sentiers -> SEN
     -  Square -> SQ
-    -  Square -> Sq
     -  Stade -> STDE
     -  Station -> STA
     -  Terrain -> TRN
@@ -254,13 +209,11 @@
     -  Terre plein -> TPL
     -  Tertre -> TRT
     -  Tertres -> TRT
-    -  Tour -> TOUR
     -  Traverse -> TRA
     -  Vallon -> VAL
     -  VallÃ©e -> VAL
     -  Venelle -> VEN
     -  Venelles -> VEN
-    -  Via -> VIA
     -  Vieille route -> VTE
     -  Vieux chemin -> VCHE
     -  Villa -> VLA
@@ -269,7 +222,6 @@
     -  Villas -> VLA
     -  Voie -> VOI
     -  Voies -> VOI
-    -  Zone -> ZONE
     -  Zone artisanale -> ZA
     -  Zone d'amÃ©nagement concertÃ© -> ZAC
     -  Zone d'amÃ©nagement diffÃ©rÃ© -> ZAD
@@ -289,7 +241,6 @@
     -  Esplanade -> ESPL
     -  Passage -> PASS
     -  Plateau -> PLAT
-    -  Rang -> RANG
     -  Rond-point -> RDPT
     -  Sentier -> SENT
     -  Subdivision -> SUBDIV
diff --git a/settings/icu-rules/variants-it.yaml b/settings/icu-rules/variants-it.yaml
index 3e45521e..55678e1a 100644
--- a/settings/icu-rules/variants-it.yaml
+++ b/settings/icu-rules/variants-it.yaml
@@ -29,7 +29,6 @@
     -  Prima -> I
     -  Primo -> I
     -  Primo -> 1
-    -  Primo -> 1Â°
     -  Quarta -> IV
     -  Quarto -> IV
     -  Quattro -> IV
diff --git a/settings/icu-rules/variants-no.yaml b/settings/icu-rules/variants-no.yaml
index de75e3c3..dd17408f 100644
--- a/settings/icu-rules/variants-no.yaml
+++ b/settings/icu-rules/variants-no.yaml
@@ -1,11 +1,10 @@
 # Source: https://wiki.openstreetmap.org/wiki/Name_finder:Abbreviations#Norsk_-_Norwegian
-- lang: no
+- lang: "no"
   words:
     # convert between Nynorsk and Bookmal here
-    -  vei, veg => v,vn,vei,veg
-    -  veien, vegen -> v,vn,veien,vegen
-    -  gate -> g,gt
+    -  ~vei, ~veg -> v,vei,veg
+    -  ~veien, ~vegen -> vn,veien,vegen
     # convert between the two female forms
-    -  gaten, gata => g,gt,gaten,gata
+    -  gate, gaten, gata -> g,gt
     -  plass, plassen -> pl
     -  sving, svingen -> sv
diff --git a/settings/icu-rules/variants-ru.yaml b/settings/icu-rules/variants-ru.yaml
index 2092e32e..87f872c5 100644
--- a/settings/icu-rules/variants-ru.yaml
+++ b/settings/icu-rules/variants-ru.yaml
@@ -1,14 +1,128 @@
 # Source: https://wiki.openstreetmap.org/wiki/Name_finder:Abbreviations#.D0.A0.D1.83.D1.81.D1.81.D0.BA.D0.B8.D0.B9_-_Russian
+# Source: https://www.plantarium.ru/page/help/topic/abbreviations.html
+# Source: https://dic.academic.ru/dic.nsf/ruwiki/1871310
 - lang: ru
   words:
+    -  ÐÐºÐ°Ð´ÐµÐ¼Ð¸Ðº, ÐÐºÐ°Ð´ÐµÐ¼Ð¸ÐºÐ° -> ÐÐº
+    -  Ð°ÐºÑÐ¸Ð¾Ð½ÐµÑÐ½Ð¾Ðµ Ð¾Ð±ÑÐµÑÑÐ²Ð¾ -> ÐÐ
     -  Ð°Ð»Ð»ÐµÑ -> Ð°Ð»
+    -  Ð°ÑÑÐ¸Ð¿ÐµÐ»Ð°Ð³ -> Ð°ÑÑ
+    -  Ð°ÑÐ¾Ð¼Ð½Ð°Ñ ÑÐ»ÐµÐºÑÑÐ¾ÑÑÐ°Ð½ÑÐ¸Ñ -> ÐÐ­Ð¡
+    -  Ð°ÑÑÐ¾Ð´ÑÐ¾Ð¼ -> Ð°ÑÑÐ´
+    -  Ð°ÑÑÐ¾Ð¿Ð¾ÑÑ -> Ð°ÑÑÐ¿
+    -  ÐÐ°ÑÐºÐ¸ÑÑÐºÐ¸Ð¹, ÐÐ°ÑÐºÐ¸ÑÑÐºÐ°Ñ, ÐÐ°ÑÐºÐ¸ÑÑÐºÐ¾Ðµ, ÐÐ°ÑÐºÐ¸ÑÑÐºÐ¸Ðµ -> ÐÐ°Ñ, ÐÐ°ÑÐº, ÐÐ°ÑÐºÐ¸Ñ
+    -  Белый, Белая, Белое, Белые -> Бел
+    -  Ð±Ð¾Ð»Ð¾ÑÐ¾ -> Ð±Ð¾Ð»
+    -  Ð±Ð¾Ð»ÑÐ½Ð¸ÑÐ° -> Ð±Ð¾Ð»ÑÐ½
+    -  ÐÐ¾Ð»ÑÑÐ¾Ð¹, ÐÐ¾Ð»ÑÑÐ°Ñ, ÐÐ¾Ð»ÑÑÐ¾Ðµ, ÐÐ¾Ð»ÑÑÐ¸Ðµ -> Ð, ÐÐ¾Ð»
+    -  Ð±ÑÐ¾Ð´ -> Ð±Ñ
     -  Ð±ÑÐ»ÑÐ²Ð°Ñ -> Ð±ÑÐ»
+    -  Ð±ÑÑÑÐ° -> Ð±ÑÑ
+    -  Ð±ÑÐ²ÑÐ¸Ð¹, Ð±ÑÐ²ÑÐ°Ñ, Ð±ÑÐ²ÑÐµÐµ, Ð±ÑÐ²ÑÐ¸Ðµ -> Ð±ÑÐ²Ñ
+    -  ÐÐµÐ»Ð¸ÐºÐ¸Ð¹, ÐÐµÐ»Ð¸ÐºÐ°Ñ, ÐÐµÐ»Ð¸ÐºÐ¾Ðµ, ÐÐµÐ»Ð¸ÐºÐ¸Ðµ -> ÐÐµÐ»
+    -  ÐÐµÑÑÐ½Ð¸Ð¹, ÐÐµÑÑÐ½ÑÑ, ÐÐµÑÑÐ½ÐµÐµ, ÐÐµÑÑÐ½Ð¸Ðµ -> Ð, ÐÐµÑÑ
+    -  Ð²Ð¾Ð´Ð¾ÐºÐ°ÑÐºÐ° -> Ð²Ð´ÐºÑ
+    -  Ð²Ð¾Ð´Ð¾Ð¿Ð°Ð´ -> Ð²Ð´Ð¿
+    -  Ð²Ð¾Ð´Ð¾ÑÑÐ°Ð½Ð¸Ð»Ð¸ÑÐµ -> Ð²Ð´ÑÑ
+    -  Ð²Ð¾ÐºÐ·Ð°Ð» -> Ð²ÐºÐ·, Ð²Ð¾ÐºÐ·
+    -  ÐÐ¾ÑÑÐ¾ÑÐ½ÑÐ¹, ÐÐ¾ÑÑÐ¾ÑÐ½Ð°Ñ, ÐÐ¾ÑÑÐ¾ÑÐ½Ð¾Ðµ, ÐÐ¾ÑÑÐ¾ÑÐ½ÑÐµ -> Ð, ÐÐ¾ÑÑ
+    -  Ð²ÑÐ»ÐºÐ°Ð½ -> Ð²Ð»Ðº
+    -  Ð³Ð¸Ð´ÑÐ¾ÑÐ»ÐµÐºÑÑÐ¾ÑÑÐ°Ð½ÑÐ¸Ñ -> ÐÐ­Ð¡
+    -  Ð³Ð¾ÑÐ° -> Ð³
+    -  Ð³Ð¾ÑÐ¾Ð´ -> Ð³
+    -  Ð´Ð²Ð¾ÑÐµÑ ÐºÑÐ»ÑÑÑÑÑ, Ð´Ð¾Ð¼ ÐºÑÐ»ÑÑÑÑÑ -> ÐÐ
+    -  Ð´Ð²Ð¾ÑÐµÑ ÑÐ¿Ð¾ÑÑÐ° -> ÐÐ¡
+    -  Ð´ÐµÑÐµÐ²Ð½Ñ -> Ð´, Ð´ÐµÑ
+    -  Ð´ÐµÑÑÐºÐ¸Ð¹ Ð¾Ð·Ð´Ð¾ÑÐ¾Ð²Ð¸ÑÐµÐ»ÑÐ½ÑÐ¹ Ð»Ð°Ð³ÐµÑÑ -> ÐÐÐ
+    -  Ð´Ð¾Ð¼ -> Ð´
+    -  Ð´Ð¾Ð¼ Ð¾ÑÐ´ÑÑÐ° -> Ð Ð
+    -  Ð¶ÐµÐ»ÐµÐ·Ð½Ð°Ñ Ð´Ð¾ÑÐ¾Ð³Ð° -> Ð¶ Ð´
+    -  Ð¶ÐµÐ»ÐµÐ·Ð½Ð¾Ð´Ð¾ÑÐ¾Ð¶Ð½ÑÐ¹, Ð¶ÐµÐ»ÐµÐ·Ð½Ð¾Ð´Ð¾ÑÐ¾Ð¶Ð½Ð°Ñ, Ð¶ÐµÐ»ÐµÐ·Ð½Ð¾Ð´Ð¾ÑÐ¾Ð¶Ð½Ð¾Ðµ -> Ð¶-Ð´
+    -  Ð¶ÐµÐ»ÐµÐ·Ð¾Ð±ÐµÑÐ¾Ð½Ð½ÑÑ Ð¸Ð·Ð´ÐµÐ»Ð¸Ð¹ -> ÐÐÐ
+    -  Ð¶Ð¸Ð»Ð¾Ð¹ ÐºÐ¾Ð¼Ð¿Ð»ÐµÐºÑ -> ÐÐ
+    -  Ð·Ð°Ð²Ð¾Ð´ -> Ð·-Ð´
+    -  Ð·Ð°ÐºÑÑÑÐ¾Ðµ Ð°Ð´Ð¼Ð¸Ð½Ð¸ÑÑÑÐ°ÑÐ¸Ð²Ð½Ð¾-ÑÐµÑÑÐ¸ÑÐ¾ÑÐ¸Ð°Ð»ÑÐ½Ð¾Ðµ Ð¾Ð±ÑÐ°Ð·Ð¾Ð²Ð°Ð½Ð¸Ðµ -> ÐÐÐ¢Ð
+    -  Ð·Ð°Ð»Ð¸Ð² -> Ð·Ð°Ð»
+    -  ÐÐ°Ð¿Ð°Ð´Ð½ÑÐ¹, ÐÐ°Ð¿Ð°Ð´Ð½Ð°Ñ, ÐÐ°Ð¿Ð°Ð´Ð½Ð¾Ðµ, ÐÐ°Ð¿Ð°Ð´Ð½ÑÐµ -> Ð, ÐÐ°Ð¿, ÐÐ°Ð¿Ð°Ð´
+    -  Ð·Ð°Ð¿Ð¾Ð²ÐµÐ´Ð½Ð¸Ðº -> Ð·Ð°Ð¿Ð¾Ð²
+    -  Ð¸Ð¼ÐµÐ½Ð¸ -> Ð¸Ð¼
+    -  Ð¸Ð½ÑÑÐ¸ÑÑÑ -> Ð¸Ð½ÑÑ
+    -  Ð¸ÑÐ¿ÑÐ°Ð²Ð¸ÑÐµÐ»ÑÐ½Ð°Ñ ÐºÐ¾Ð»Ð¾Ð½Ð¸Ñ -> ÐÐ
+    -  ÐºÐ¸Ð»Ð¾Ð¼ÐµÑÑ -> ÐºÐ¼
+    -  ÐÑÐ°ÑÐ½ÑÐ¹, ÐÑÐ°ÑÐ½Ð°Ñ, ÐÑÐ°ÑÐ½Ð¾Ðµ, ÐÑÐ°ÑÐ½ÑÐµ -> ÐÑ, ÐÑÐ°Ñ
+    -  Ð»Ð°Ð³ÐµÑÑ -> Ð»Ð°Ð³
+    -  Левый, Левая, Левое, Левые -> Л, Лев
+    -  Ð»ÐµÐ´Ð½Ð¸Ðº -> Ð»ÐµÐ´Ð½
+    -  Ð»ÐµÑÐ½Ð¸ÑÐµÑÑÐ²Ð¾ -> Ð»ÐµÑÐ½Ð¸Ñ
+    -  Ð»ÐµÑÐ½Ð¾Ð¹, Ð»ÐµÑÐ½Ð°Ñ, Ð»ÐµÑÐ½Ð¾Ðµ -> Ð»ÐµÑ
+    -  Ð»Ð¸Ð½Ð¸Ñ ÑÐ»ÐµÐºÑÑÐ¾Ð¿ÐµÑÐµÐ´Ð°ÑÐ¸ -> ÐÐ­Ð
+    -  ÐÐ°Ð»ÑÐ¹, ÐÐ°Ð»Ð°Ñ, ÐÐ°Ð»Ð¾Ðµ, ÐÐ°Ð»ÑÐµ -> Ð, ÐÐ°Ð»
+    -  ÐÐ¾ÑÐ´Ð¾Ð²ÑÐºÐ¸Ð¹, ÐÐ¾ÑÐ´Ð¾Ð²ÑÐºÐ°Ñ, ÐÐ¾ÑÐ´Ð¾Ð²ÑÐºÐ¾Ðµ, ÐÐ¾ÑÐ´Ð¾Ð²ÑÐºÐ¸Ðµ -> ÐÐ¾ÑÐ´Ð¾Ð²
+    -  Ð¼Ð¾ÑÑÐºÐ¾Ð¹, Ð¼Ð¾ÑÑÐºÐ°Ñ, Ð¼Ð¾ÑÑÐºÐ¾Ðµ -> Ð¼Ð¾Ñ
+    -  ÐÐ¾ÑÐºÐ¾Ð²ÑÐºÐ¸Ð¹, ÐÐ¾ÑÐºÐ¾Ð²ÑÐºÐ°Ñ, ÐÐ¾ÑÐºÐ¾Ð²ÑÐºÐ¾Ðµ, ÐÐ¾ÑÐºÐ¾Ð²ÑÐºÐ¸Ðµ -> ÐÐ¾Ñ, ÐÐ¾ÑÐº
+    -  Ð¼ÑÑ -> Ð¼
     -  Ð½Ð°Ð±ÐµÑÐµÐ¶Ð½Ð°Ñ -> Ð½Ð°Ð±
+    -  ÐÐ¸Ð¶Ð½Ð¸Ð¹, ÐÐ¸Ð¶Ð½ÑÑ, ÐÐ¸Ð¶Ð½ÐµÐµ, ÐÐ¸Ð¶Ð½Ð¸Ðµ -> ÐÐ¸Ð¶, Ð
+    -  ÐÐ¾Ð²ÑÐ¹, ÐÐ¾Ð²Ð°Ñ, ÐÐ¾Ð²Ð¾Ðµ, ÐÐ¾Ð²ÑÐµ -> ÐÐ¾Ð², Ð
+    -  Ð¾Ð±Ð³Ð¾Ð½Ð½ÑÐ¹ Ð¿ÑÐ½ÐºÑ -> Ð¾Ð±Ð³ Ð¿
+    -  Ð¾Ð±Ð»Ð°ÑÑÑ -> Ð¾Ð±Ð»
+    -  Ð¾Ð·ÐµÑÐ¾ -> Ð¾Ð·
+    -  Ð¾ÑÐ¾Ð±Ð¾ Ð¾ÑÑÐ°Ð½ÑÐµÐ¼Ð°Ñ Ð¿ÑÐ¸ÑÐ¾Ð´Ð½Ð°Ñ ÑÐµÑÑÐ¸ÑÐ¾ÑÐ¸Ñ -> ÐÐÐÐ¢
+    -  Ð¾ÑÑÐ°Ð½Ð¾Ð²Ð¾ÑÐ½ÑÐ¹ Ð¿ÑÐ½ÐºÑ -> Ð¾ Ð¿
+    -  Ð¾ÑÑÑÐ¾Ð² -> Ð¾
+    -  Ð¾ÑÑÑÐ¾Ð²Ð° -> Ð¾-Ð²Ð°
+    -  Ð¿Ð°ÑÐº ÐºÑÐ»ÑÑÑÑÑ Ð¸ Ð¾ÑÐ´ÑÑÐ° -> ÐÐÐ¸Ð
+    -  Ð¿ÐµÑÐµÐ²Ð°Ð» -> Ð¿ÐµÑ
     -  Ð¿ÐµÑÐµÑÐ»Ð¾Ðº -> Ð¿ÐµÑ
+    -  Ð¿ÐµÑÐµÑÐ° -> Ð¿ÐµÑ
+    -  Ð¿Ð¸Ð¾Ð½ÐµÑÑÐºÐ¸Ð¹ Ð»Ð°Ð³ÐµÑÑ -> Ð¿Ð¸Ð¾Ð½ÐµÑÐ»Ð°Ð³
+    -  Ð¿Ð»Ð°ÑÑÐ¾ÑÐ¼Ð° -> Ð¿Ð», Ð¿Ð»Ð°ÑÑ
     -  Ð¿Ð»Ð¾ÑÐ°Ð´Ñ -> Ð¿Ð»
+    -  Ð¿Ð¾Ð´ÑÐ¾Ð±Ð½Ð¾Ðµ ÑÐ¾Ð·ÑÐ¹ÑÑÐ²Ð¾ -> Ð¿Ð¾Ð´ÑÐ¾Ð± ÑÐ¾Ð·
+    -  Ð¿Ð¾Ð»ÑÐ¾ÑÑÑÐ¾Ð² -> Ð¿-Ð¾Ð²
+    -  Ð¿Ð¾ÑÑÐ»Ð¾Ðº -> Ð¿Ð¾Ñ, Ð¿
+    -  Ð¿Ð¾ÑÑÐ»Ð¾Ðº Ð³Ð¾ÑÐ¾Ð´ÑÐºÐ¾Ð³Ð¾ ÑÐ¸Ð¿Ð° -> Ð¿ Ð³ Ñ, Ð¿Ð³Ñ
+    -  ÐÑÐ°Ð²ÑÐ¹, ÐÑÐ°Ð²Ð°Ñ, ÐÑÐ°Ð²Ð¾Ðµ, ÐÑÐ°Ð²ÑÐµ -> Ð, ÐÑ, ÐÑÐ°Ð²
     -  Ð¿ÑÐ¾ÐµÐ·Ð´ -> Ð¿Ñ
     -  Ð¿ÑÐ¾ÑÐ¿ÐµÐºÑ -> Ð¿ÑÐ¾ÑÐ¿
-    -  ÑÐ¾ÑÑÐµ -> Ñ
+    -  Ð¿ÑÑÐ´ -> Ð¿Ñ
+    -  Ð¿ÑÑÑÑÐ½Ñ -> Ð¿ÑÑÑ
+    -  ÑÐ°Ð·ÑÐµÐ·Ð´ -> ÑÐ·Ð´
+    -  ÑÐ°Ð¹Ð¾Ð½ -> Ñ-Ð½
+    -  ÑÐµÐ·Ð¸Ð½Ð¾ÑÐµÑÐ½Ð¸ÑÐµÑÐºÐ¸Ñ Ð¸Ð·Ð´ÐµÐ»Ð¸Ð¹ -> Ð Ð¢Ð
+    -  ÑÐµÐºÐ° -> Ñ
+    -  ÑÐµÑÐ½Ð¾Ð¹, ÑÐµÑÐ½Ð°Ñ, ÑÐµÑÐ½Ð¾Ðµ -> ÑÐµÑ, ÑÐµÑÐ½
+    -  Ð Ð¾ÑÑÐ¸Ð¹ÑÐºÐ¸Ð¹, Ð Ð¾ÑÑÐ¸Ð¹ÑÐºÐ°Ñ, Ð Ð¾ÑÑÐ¸Ð¹ÑÐºÐ¾Ðµ, Ð Ð¾ÑÑÐ¸Ð¹ÑÐºÐ¸Ðµ -> Ð Ð¾Ñ
+    -  Ð ÑÑÑÐºÐ¸Ð¹, Ð ÑÑÑÐºÐ°Ñ, Ð ÑÑÑÐºÐ¾Ðµ, Ð ÑÑÑÐºÐ¸Ðµ -> Ð ÑÑ, Ð ÑÑÑÐº
+    -  ÑÑÑÐµÐ¹ -> ÑÑÑ
+    -  ÑÐ°Ð´Ð¾Ð²Ð¾Ðµ Ð½ÐµÐºÐ¾Ð¼Ð¼ÐµÑÑÐµÑÐºÐ¾Ðµ ÑÐ¾Ð²Ð°ÑÐ¸ÑÐµÑÑÐ²Ð¾ -> Ð¡ÐÐ¢
+    -  ÑÐ°Ð´Ð¾Ð²ÑÐµ ÑÑÐ°ÑÑÐºÐ¸ -> ÑÐ°Ð´ ÑÑ
+    -  ÑÐ°Ð½Ð°ÑÐ¾ÑÐ¸Ð¹ -> ÑÐ°Ð½
+    -  ÑÐ°ÑÐ°Ð¹ -> ÑÐ°Ñ
+    -  Ð¡ÐµÐ²ÐµÑÐ½ÑÐ¹, Ð¡ÐµÐ²ÐµÑÐ½Ð°Ñ, Ð¡ÐµÐ²ÐµÑÐ½Ð¾Ðµ, Ð¡ÐµÐ²ÐµÑÐ½ÑÐµ -> Ð¡, Ð¡ÐµÐ²
+    -  ÑÐµÐ»Ð¾ -> Ñ
+    -  Ð¡Ð¸Ð±Ð¸ÑÑÐºÐ¸Ð¹, Ð¡Ð¸Ð±Ð¸ÑÑÐºÐ°Ñ, Ð¡Ð¸Ð±Ð¸ÑÑÐºÐ¾Ðµ, Ð¡Ð¸Ð±Ð¸ÑÑÐºÐ¸Ðµ -> Ð¡Ð¸Ð±
+    -  Ð¡Ð¾Ð²ÐµÑÑÐºÐ¸Ð¹, Ð¡Ð¾Ð²ÐµÑÑÐºÐ°Ñ, Ð¡Ð¾Ð²ÐµÑÑÐºÐ¾Ðµ, Ð¡Ð¾Ð²ÐµÑÑÐºÐ¸Ðµ -> Ð¡Ð¾Ð²
+    -  ÑÐ¾Ð²ÑÐ¾Ð· -> ÑÐ²Ñ
+    -  Ð¡Ð¾ÑÑÐ¸ÑÐ¾Ð²Ð¾ÑÐ½ÑÐ¹, Ð¡Ð¾ÑÑÐ¸ÑÐ¾Ð²Ð¾ÑÐ½Ð°Ñ, Ð¡Ð¾ÑÑÐ¸ÑÐ¾Ð²Ð¾ÑÐ½Ð¾Ðµ, Ð¡Ð¾ÑÑÐ¸ÑÐ¾Ð²Ð¾ÑÐ½ÑÐµ -> Ð¡Ð¾ÑÑ
+    -  ÑÑÐ°Ð½ÑÐ¸Ñ -> ÑÑ
+    -  Ð¡ÑÐ°ÑÑÐ¹, Ð¡ÑÐ°ÑÐ°Ñ, Ð¡ÑÐµÐ´Ð½ÐµÐµ, Ð¡ÑÐµÐ´Ð½Ð¸Ðµ -> Ð¡Ñ
+    -  Ð¢Ð°ÑÐ°ÑÑÐºÐ¸Ð¹, Ð¢Ð°ÑÐ°ÑÑÐºÐ°Ñ, Ð¢Ð°ÑÐ°ÑÑÐºÐ¾Ðµ, Ð¢Ð°ÑÐ°ÑÑÐºÐ¸Ðµ -> Ð¢Ð°Ñ, Ð¢Ð°ÑÐ°Ñ
+    -  теплоэлектростанция -> ТЭС
+    -  ÑÐµÐ¿Ð»Ð¾ÑÐ»ÐµÐºÑÑÐ¾ÑÐµÐ½ÑÑÐ°Ð»Ñ -> Ð¢Ð­Ð¦
+    -  ÑÐµÑÐ½Ð¸ÐºÑÐ¼ -> ÑÐµÑÐ½
+    -  ÑÐ¾Ð½Ð½ÐµÐ»Ñ, ÑÑÐ½Ð½ÐµÐ»Ñ -> ÑÑÐ½
     -  ÑÑÐ¿Ð¸Ðº -> ÑÑÐ¿
     -  ÑÐ»Ð¸ÑÐ° -> ÑÐ»
-    -  Ð¾Ð±Ð»Ð°ÑÑÑ -> Ð¾Ð±Ð»
+    -  Ð£ÑÐ°Ð»ÑÑÐºÐ¸Ð¹, Ð£ÑÐ°Ð»ÑÑÐºÐ°Ñ, Ð£ÑÐ°Ð»ÑÑÐºÐ¾Ðµ, Ð£ÑÐ°Ð»ÑÑÐºÐ¸Ðµ -> Ð£Ñ, Ð£ÑÐ°Ð»
+    -  ÑÑÐ¾ÑÐ¸ÑÐµ -> ÑÑ
+    -  ÑÐ¾Ð·ÑÐ¹ÑÑÐ²Ð¾ -> ÑÐ¾Ð·, ÑÐ¾Ð·-Ð²Ð¾
+    -  ÑÑÐµÐ±ÐµÑ -> ÑÑ
+    -  ÑÑÑÐ¾Ñ -> ÑÑÑ
+    -  Ð§ÑÑÐ½ÑÐ¹, Ð§ÑÑÐ½Ð°Ñ, Ð§ÑÑÐ½Ð¾Ðµ, Ð§ÑÑÐ½ÑÐµ -> Ð§ÐµÑÐ½
+    -  Ð§ÑÐ²Ð°ÑÑÐºÐ¸Ð¹, Ð§ÑÐ²Ð°ÑÑÐºÐ°Ñ, Ð§ÑÐ²Ð°ÑÑÐºÐ¾Ðµ, Ð§ÑÐ²Ð°ÑÑÐºÐ¸Ðµ -> Ð§ÑÐ²Ð°Ñ
+    -  ÑÐ°ÑÑÐ° -> ÑÐ°Ñ
+    -  ÑÐºÐ¾Ð»Ð° -> ÑÐº
+    -  ÑÐ¾ÑÑÐµ -> Ñ
+    -  ÑÐ»ÐµÐ²Ð°ÑÐ¾Ñ -> ÑÐ»ÐµÐ²
+    -  Ð®Ð¶Ð½ÑÐ¹, Ð®Ð¶Ð½Ð°Ñ, Ð®Ð¶Ð½Ð¾Ðµ, Ð®Ð¶Ð½ÑÐµ -> Ð®, Ð®Ð¶, Ð®Ð¶Ð½
\ No newline at end of file
diff --git a/settings/icu_tokenizer.yaml b/settings/icu_tokenizer.yaml
index c5a809c6..bb81f80b 100644
--- a/settings/icu_tokenizer.yaml
+++ b/settings/icu_tokenizer.yaml
@@ -1,3 +1,6 @@
+query-preprocessing:
+    - step: split_japanese_phrases
+    - step: normalize
 normalization:
     - ":: lower ()"
     - ":: Hans-Hant"
@@ -7,16 +10,17 @@ normalization:
     - "'nÂº' > 'no'"
     - "Âª > a"
     - "Âº > o"
-    - "[[:Punctuation:][:Symbol:]\u02bc]  > ' '"
+    - "[[:Punctuation:][:Symbol:][\u02bc] - [-:]]+  > '-'"
     - "Ã > 'ss'" # German szet is unambiguously equal to double ss
-    - "[^[:alnum:] [:Canonical_Combining_Class=Virama:] [:Space:]] >"
+    - "[^[:alnum:] [:Canonical_Combining_Class=Virama:] [:Space:] [-:]] >"
     - "[:Lm:] >"
     - ":: [[:Number:]] Latin ()"
     - ":: [[:Number:]] Ascii ();"
     - ":: [[:Number:]] NFD ();"
     - "[[:Nonspacing Mark:] [:Cf:]] >;"
-    - "[:Space:]+ > ' '"
+    - "[-:]?[:Space:]+[-:]? > ' '"
 transliteration:
+    - "[-:]  > ' '"
     - ":: Latin ()"
     - !include icu-rules/extended-unicode-to-asccii.yaml
     - ":: Ascii ()"
@@ -42,7 +46,7 @@ sanitizers:
     - step: strip-brace-terms
     - step: tag-analyzer-by-language
       filter-kind: [".*name.*"]
-      whitelist: [bg,ca,cs,da,de,el,en,es,et,eu,fi,fr,gl,hu,it,ja,mg,ms,nl,no,pl,pt,ro,ru,sk,sl,sv,tr,uk,vi]
+      whitelist: [bg,ca,cs,da,de,el,en,es,et,eu,fi,fr,gl,hu,it,ja,mg,ms,nl,"no",pl,pt,ro,ru,sk,sl,sv,tr,uk,vi]
       use-defaults: all
       mode: append
     - step: tag-japanese
@@ -154,7 +158,7 @@ token-analysis:
       mode: variant-only
       variants:
           - !include icu-rules/variants-nl.yaml
-    - id: no
+    - id: "no"
       analyzer: generic
       mode: variant-only
       variants:
diff --git a/settings/import-address.lua b/settings/import-address.lua
deleted file mode 100644
index b177b73c..00000000
--- a/settings/import-address.lua
+++ /dev/null
@@ -1,74 +0,0 @@
-local flex = require('flex-base')
-
-flex.set_main_tags{
-    highway = {motorway = 'always',
-               trunk = 'always',
-               primary = 'always',
-               secondary = 'always',
-               tertiary = 'always',
-               unclassified = 'always',
-               residential = 'always',
-               road = 'always',
-               living_street = 'always',
-               pedestrian = 'always',
-               service = 'named',
-               cycleway = 'named',
-               path = 'named',
-               footway = 'named',
-               steps = 'named',
-               bridleway = 'named',
-               track = 'named',
-               motorway_link = 'named',
-               trunk_link = 'named',
-               primary_link = 'named',
-               secondary_link = 'named',
-               tertiary_link = 'named'},
-    boundary = {administrative = 'named',
-                postal_code = 'always'},
-    landuse = 'fallback',
-    place = 'always'
-}
-
-flex.set_prefilters{delete_keys = {'building', 'source',
-                                   'source', '*source', 'type',
-                                   'is_in:postcode', '*:wikidata', '*:wikipedia',
-                                   '*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
-                                   'name:etymology', 'name:signed', 'name:botanical',
-                                   'addr:street:name', 'addr:street:type'},
-                    delete_tags = {landuse = {'cemetry', 'no'},
-                                   boundary = {'place'}},
-                    extra_keys = {'wikipedia', 'wikipedia:*', 'wikidata', 'capital', 'area'}
-                   }
-
-flex.set_name_tags{main = {'name', 'name:*',
-                          'int_name', 'int_name:*',
-                          'nat_name', 'nat_name:*',
-                          'reg_name', 'reg_name:*',
-                          'loc_name', 'loc_name:*',
-                          'old_name', 'old_name:*',
-                          'alt_name', 'alt_name:*', 'alt_name_*',
-                          'official_name', 'official_name:*',
-                          'place_name', 'place_name:*',
-                          'short_name', 'short_name:*'},
-                   extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
-                            'loc_ref', 'old_ref',
-                            'iata', 'icao', 'pcode', 'pcode:*', 'ISO3166-2'},
-                   house = {'addr:housename'}
-                  }
-
-flex.set_address_tags{main = {'addr:housenumber',
-                              'addr:conscriptionnumber',
-                              'addr:streetnumber'},
-                      extra = {'addr:*', 'is_in:*', 'tiger:county'},
-                      postcode = {'postal_code', 'postcode', 'addr:postcode',
-                                  'tiger:zip_left', 'tiger:zip_right'},
-                      country = {'country_code', 'ISO3166-1',
-                                 'addr:country_code', 'is_in:country_code',
-                                 'addr:country', 'is_in:country'},
-                      interpolation = {'addr:interpolation'}
-                     }
-
-
-flex.set_unused_handling{extra_keys = {'place'}}
-
-return flex
diff --git a/settings/import-admin.lua b/settings/import-admin.lua
deleted file mode 100644
index 78eac5f5..00000000
--- a/settings/import-admin.lua
+++ /dev/null
@@ -1,72 +0,0 @@
-local flex = require('flex-base')
-
-flex.set_main_tags{
-    boundary = {administrative = 'named'},
-    landuse = {residential = 'fallback',
-               farm = 'fallback',
-               farmyard = 'fallback',
-               industrial = 'fallback',
-               commercial = 'fallback',
-               allotments = 'fallback',
-               retail = 'fallback'},
-    place = {county = 'always',
-             district = 'always',
-             municipality = 'always',
-             city = 'always',
-             town = 'always',
-             borough = 'always',
-             village = 'always',
-             suburb = 'always',
-             hamlet = 'always',
-             croft = 'always',
-             subdivision = 'always',
-             allotments = 'always',
-             neighbourhood = 'always',
-             quarter = 'always',
-             isolated_dwelling = 'always',
-             farm = 'always',
-             city_block = 'always',
-             mountain_pass = 'always',
-             square = 'always',
-             locality = 'always'}
-}
-
-flex.set_prefilters{delete_keys = {'building', 'source', 'highway',
-                                   'addr:housenumber', 'addr:street', 'addr:city',
-                                   'addr:interpolation',
-                                   'source', '*source', 'type',
-                                   'is_in:postcode', '*:wikidata', '*:wikipedia',
-                                   '*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
-                                   'name:etymology', 'name:signed', 'name:botanical',
-                                   'addr:street:name', 'addr:street:type'},
-                    delete_tags = {landuse = {'cemetry', 'no'},
-                                   boundary = {'place'}},
-                    extra_keys = {'wikipedia', 'wikipedia:*', 'wikidata', 'capital'}
-                   }
-
-flex.set_name_tags{main = {'name', 'name:*',
-                          'int_name', 'int_name:*',
-                          'nat_name', 'nat_name:*',
-                          'reg_name', 'reg_name:*',
-                          'loc_name', 'loc_name:*',
-                          'old_name', 'old_name:*',
-                          'alt_name', 'alt_name:*', 'alt_name_*',
-                          'official_name', 'official_name:*',
-                          'place_name', 'place_name:*',
-                          'short_name', 'short_name:*'},
-                   extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
-                            'loc_ref', 'old_ref',
-                            'iata', 'icao', 'pcode', 'pcode:*', 'ISO3166-2'}
-                  }
-
-flex.set_address_tags{extra = {'addr:*', 'is_in:*'},
-                      postcode = {'postal_code', 'postcode', 'addr:postcode'},
-                      country = {'country_code', 'ISO3166-1',
-                                 'addr:country_code', 'is_in:country_code',
-                                 'addr:country', 'is_in:country'},
-                      postcode_fallback = false
-                     }
-
-flex.set_unused_handling{extra_keys = {'place'}}
-
-return flex
diff --git a/settings/import-extratags.lua b/settings/import-extratags.lua
deleted file mode 100644
index 0d242b0f..00000000
--- a/settings/import-extratags.lua
+++ /dev/null
@@ -1,126 +0,0 @@
-local flex = require('flex-base')
-
-flex.set_main_tags{
-    building = 'fallback',
-    emergency = 'always',
-    healthcare = 'fallback',
-    historic = 'always',
-    military = 'always',
-    natural = 'named',
-    highway = {'always',
-               street_lamp = 'named',
-               traffic_signals = 'named',
-               service = 'named',
-               cycleway = 'named',
-               path = 'named',
-               footway = 'named',
-               steps = 'named',
-               bridleway = 'named',
-               track = 'named',
-               motorway_link = 'named',
-               trunk_link = 'named',
-               primary_link = 'named',
-               secondary_link = 'named',
-               tertiary_link = 'named'},
-    railway = 'named',
-    man_made = {'none',
-                pier = 'always',
-                tower = 'always',
-                bridge = 'always',
-                works = 'named',
-                water_tower = 'always',
-                dyke = 'named',
-                adit = 'named',
-                lighthouse = 'always',
-                watermill = 'always',
-                tunnel = 'always'},
-    aerialway = 'always',
-    boundary = {'named',
-                postal_code = 'always'},
-    aeroway = 'always',
-    amenity = 'always',
-    club = 'always',
-    craft = 'always',
-    junction = 'fallback',
-    landuse = 'fallback',
-    leisure = {'always',
-               nature_reserve = 'fallback'},
-    office = 'always',
-    mountain_pass = 'always',
-    shop = 'always',
-    tourism = 'always',
-    bridge = 'named_with_key',
-    tunnel = 'named_with_key',
-    waterway = 'named',
-    place = 'always'
-}
-
-flex.set_prefilters{delete_keys = {'note', 'note:*', 'source', '*source', 'attribution',
-                                   'comment', 'fixme', 'FIXME', 'created_by', 'NHD:*',
-                                   'nhd:*', 'gnis:*', 'geobase:*', 'KSJ2:*', 'yh:*',
-                                   'osak:*', 'naptan:*', 'CLC:*', 'import', 'it:fvg:*',
-                                   'type', 'lacounty:*', 'ref:ruian:*', 'building:ruian:type',
-                                   'ref:linz:*', 'is_in:postcode'},
-                    delete_tags = {emergency = {'yes', 'no', 'fire_hydrant'},
-                                   historic = {'yes', 'no'},
-                                   military = {'yes', 'no'},
-                                   natural = {'yes', 'no', 'coastline'},
-                                   highway = {'no', 'turning_circle', 'mini_roundabout',
-                                              'noexit', 'crossing', 'give_way', 'stop'},
-                                   railway = {'level_crossing', 'no', 'rail', 'switch',
-                                              'abandoned', 'signal', 'buffer_stop', 'razed'},
-                                   aerialway = {'pylon', 'no'},
-                                   aeroway = {'no'},
-                                   amenity = {'no', 'parking_space', 'parking_entrance',
-                                              'waste_disposal', 'hunting_stand'},
-                                   club = {'no'},
-                                   craft = {'no'},
-                                   leisure = {'no'},
-                                   office = {'no'},
-                                   mountain_pass = {'no'},
-                                   shop = {'no'},
-                                   tourism = {'yes', 'no'},
-                                   bridge = {'no'},
-                                   tunnel = {'no'},
-                                   waterway = {'riverbank'},
-                                   building = {'no'},
-                                   boundary = {'place', 'land_area'}},
-                    extra_keys = {'*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
-                               'name:etymology', 'name:signed', 'name:botanical',
-                               'wikidata', '*:wikidata',
-                               '*:wikipedia', 'brand:wikipedia:*',
-                               'addr:street:name', 'addr:street:type'}
-                   }
-
-flex.set_name_tags{main = {'name', 'name:*',
-                          'int_name', 'int_name:*',
-                          'nat_name', 'nat_name:*',
-                          'reg_name', 'reg_name:*',
-                          'loc_name', 'loc_name:*',
-                          'old_name', 'old_name:*',
-                          'alt_name', 'alt_name:*', 'alt_name_*',
-                          'official_name', 'official_name:*',
-                          'place_name', 'place_name:*',
-                          'short_name', 'short_name:*', 'brand'},
-                   extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
-                            'loc_ref', 'old_ref',
-                            'iata', 'icao', 'pcode', 'pcode:*', 'ISO3166-2'},
-                   house = {'addr:housename'}
-                  }
-
-flex.set_address_tags{main = {'addr:housenumber',
-                              'addr:conscriptionnumber',
-                              'addr:streetnumber'},
-                      extra = {'addr:*', 'is_in:*', 'tiger:county'},
-                      postcode = {'postal_code', 'postcode', 'addr:postcode',
-                                  'tiger:zip_left', 'tiger:zip_right'},
-                      country = {'country_code', 'ISO3166-1',
-                                 'addr:country_code', 'is_in:country_code',
-                                 'addr:country', 'is_in:country'},
-                      interpolation = {'addr:interpolation'}
-                     }
-
-
-flex.set_unused_handling{delete_keys = {'tiger:*'}}
-
-return flex
diff --git a/settings/import-full.lua b/settings/import-full.lua
deleted file mode 100644
index 11bd1f3a..00000000
--- a/settings/import-full.lua
+++ /dev/null
@@ -1,126 +0,0 @@
-local flex = require('flex-base')
-
-flex.set_main_tags{
-    building = 'fallback',
-    emergency = 'always',
-    healthcare = 'fallback',
-    historic = 'always',
-    military = 'always',
-    natural = 'named',
-    highway = {'always',
-               street_lamp = 'named',
-               traffic_signals = 'named',
-               service = 'named',
-               cycleway = 'named',
-               path = 'named',
-               footway = 'named',
-               steps = 'named',
-               bridleway = 'named',
-               track = 'named',
-               motorway_link = 'named',
-               trunk_link = 'named',
-               primary_link = 'named',
-               secondary_link = 'named',
-               tertiary_link = 'named'},
-    railway = 'named',
-    man_made = {'none',
-                pier = 'always',
-                tower = 'always',
-                bridge = 'always',
-                works = 'named',
-                water_tower = 'always',
-                dyke = 'named',
-                adit = 'named',
-                lighthouse = 'always',
-                watermill = 'always',
-                tunnel = 'always'},
-    aerialway = 'always',
-    boundary = {'named',
-                postal_code = 'always'},
-    aeroway = 'always',
-    amenity = 'always',
-    club = 'always',
-    craft = 'always',
-    junction = 'fallback',
-    landuse = 'fallback',
-    leisure = {'always',
-               nature_reserve = 'fallback'},
-    office = 'always',
-    mountain_pass = 'always',
-    shop = 'always',
-    tourism = 'always',
-    bridge = 'named_with_key',
-    tunnel = 'named_with_key',
-    waterway = 'named',
-    place = 'always'
-}
-
-flex.set_prefilters{delete_keys = {'note', 'note:*', 'source', '*source', 'attribution',
-                                   'comment', 'fixme', 'FIXME', 'created_by', 'NHD:*',
-                                   'nhd:*', 'gnis:*', 'geobase:*', 'KSJ2:*', 'yh:*',
-                                   'osak:*', 'naptan:*', 'CLC:*', 'import', 'it:fvg:*',
-                                   'type', 'lacounty:*', 'ref:ruian:*', 'building:ruian:type',
-                                   'ref:linz:*', 'is_in:postcode',
-                                   '*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
-                                   'name:etymology', 'name:signed', 'name:botanical',
-                                   '*:wikidata', '*:wikipedia', 'brand:wikipedia:*',
-                                   'addr:street:name', 'addr:street:type'},
-                    delete_tags = {emergency = {'yes', 'no', 'fire_hydrant'},
-                                   historic = {'yes', 'no'},
-                                   military = {'yes', 'no'},
-                                   natural = {'yes', 'no', 'coastline'},
-                                   highway = {'no', 'turning_circle', 'mini_roundabout',
-                                              'noexit', 'crossing', 'give_way', 'stop'},
-                                   railway = {'level_crossing', 'no', 'rail', 'switch',
-                                              'abandoned', 'signal', 'buffer_stop', 'razed'},
-                                   aerialway = {'pylon', 'no'},
-                                   aeroway = {'no'},
-                                   amenity = {'no', 'parking_space', 'parking_entrance',
-                                              'waste_disposal', 'hunting_stand'},
-                                   club = {'no'},
-                                   craft = {'no'},
-                                   leisure = {'no'},
-                                   office = {'no'},
-                                   mountain_pass = {'no'},
-                                   shop = {'no'},
-                                   tourism = {'yes', 'no'},
-                                   bridge = {'no'},
-                                   tunnel = {'no'},
-                                   waterway = {'riverbank'},
-                                   building = {'no'},
-                                   boundary = {'place', 'land_area'}},
-                    extra_keys = {'wikidata', 'wikipedia', 'wikipedia:*'}
-                   }
-
-flex.set_name_tags{main = {'name', 'name:*',
-                          'int_name', 'int_name:*',
-                          'nat_name', 'nat_name:*',
-                          'reg_name', 'reg_name:*',
-                          'loc_name', 'loc_name:*',
-                          'old_name', 'old_name:*',
-                          'alt_name', 'alt_name:*', 'alt_name_*',
-                          'official_name', 'official_name:*',
-                          'place_name', 'place_name:*',
-                          'short_name', 'short_name:*', 'brand'},
-                   extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
-                            'loc_ref', 'old_ref',
-                            'iata', 'icao', 'pcode', 'pcode:*', 'ISO3166-2'},
-                   house = {'addr:housename'}
-                  }
-
-flex.set_address_tags{main = {'addr:housenumber',
-                              'addr:conscriptionnumber',
-                              'addr:streetnumber'},
-                      extra = {'addr:*', 'is_in:*', 'tiger:county'},
-                      postcode = {'postal_code', 'postcode', 'addr:postcode',
-                                  'tiger:zip_left', 'tiger:zip_right'},
-                      country = {'country_code', 'ISO3166-1',
-                                 'addr:country_code', 'is_in:country_code',
-                                 'addr:country', 'is_in:country'},
-                      interpolation = {'addr:interpolation'}
-                     }
-
-
-flex.set_unused_handling{extra_keys = {'place'}}
-
-return flex
diff --git a/settings/import-street.lua b/settings/import-street.lua
deleted file mode 100644
index 60b76dfb..00000000
--- a/settings/import-street.lua
+++ /dev/null
@@ -1,74 +0,0 @@
-local flex = require('flex-base')
-
-flex.set_main_tags{
-    highway = {motorway = 'always',
-               trunk = 'always',
-               primary = 'always',
-               secondary = 'always',
-               tertiary = 'always',
-               unclassified = 'always',
-               residential = 'always',
-               road = 'always',
-               living_street = 'always',
-               pedestrian = 'always',
-               service = 'named',
-               cycleway = 'named',
-               path = 'named',
-               footway = 'named',
-               steps = 'named',
-               bridleway = 'named',
-               track = 'named',
-               motorway_link = 'named',
-               trunk_link = 'named',
-               primary_link = 'named',
-               secondary_link = 'named',
-               tertiary_link = 'named'},
-    boundary = {administrative = 'named',
-                postal_code = 'always'},
-    landuse = 'fallback',
-    place = 'always'
-}
-
-flex.set_prefilters{delete_keys = {'building', 'source',
-                                   'addr:housenumber', 'addr:street',
-                                   'source', '*source', 'type',
-                                   'is_in:postcode', '*:wikidata', '*:wikipedia',
-                                   '*:prefix', '*:suffix', 'name:prefix:*', 'name:suffix:*',
-                                   'name:etymology', 'name:signed', 'name:botanical',
-                                   'addr:street:name', 'addr:street:type'},
-                    delete_tags = {landuse = {'cemetry', 'no'},
-                                   boundary = {'place'}},
-                    extra_keys = {'wikipedia', 'wikipedia:*', 'wikidata', 'capital', 'area'}
-                   }
-
-flex.set_name_tags{main = {'name', 'name:*',
-                          'int_name', 'int_name:*',
-                          'nat_name', 'nat_name:*',
-                          'reg_name', 'reg_name:*',
-                          'loc_name', 'loc_name:*',
-                          'old_name', 'old_name:*',
-                          'alt_name', 'alt_name:*', 'alt_name_*',
-                          'official_name', 'official_name:*',
-                          'place_name', 'place_name:*',
-                          'short_name', 'short_name:*'},
-                   extra = {'ref', 'int_ref', 'nat_ref', 'reg_ref',
-                            'loc_ref', 'old_ref',
-                            'iata', 'icao', 'pcode', 'pcode:*', 'ISO3166-2'}
-                  }
-
-flex.set_address_tags{main = {'addr:housenumber',
-                              'addr:conscriptionnumber',
-                              'addr:streetnumber'},
-                      extra = {'addr:*', 'is_in:*', 'tiger:county'},
-                      postcode = {'postal_code', 'postcode', 'addr:postcode',
-                                  'tiger:zip_left', 'tiger:zip_right'},
-                      country = {'country_code', 'ISO3166-1',
-                                 'addr:country_code', 'is_in:country_code',
-                                 'addr:country', 'is_in:country'},
-                      interpolation = {'addr:interpolation'},
-                      postcode_fallback = false
-                     }
-
-flex.set_unused_handling{extra_keys = {'place'}}
-
-return flex
diff --git a/settings/taginfo.lua b/settings/taginfo.lua
deleted file mode 100644
index ef2ad2a6..00000000
--- a/settings/taginfo.lua
+++ /dev/null
@@ -1,74 +0,0 @@
--- Prints taginfo project description in the standard output
---
-
--- create fake "osm2pgsql" table for flex-base, originally created by the main C++ program
-osm2pgsql = {}
-function osm2pgsql.define_table(...) end
-
--- provide path to flex-style lua file
-flex = require('import-extratags')
-local json = require ('dkjson')
-
-
------------- helper functions ---------------------
-
-function get_key_description(key, description)
-    local desc = {}
-    desc.key = key
-    desc.description = description
-    set_keyorder(desc, {'key', 'description'})
-    return desc
-end
-
--- Sets the key order for the resulting JSON table
-function set_keyorder(table, order)
-    setmetatable(table, {
-        __jsonorder = order
-    })
-end
-
-
--- Prints the collected tags in the required format in JSON
-function print_taginfo()
-    local tags = {}
-
-    for _, k in ipairs(flex.TAGINFO_MAIN.keys) do
-        local desc = get_key_description(k, 'POI/feature in the search database')
-        if flex.TAGINFO_MAIN.delete_tags[k] ~= nil then
-            desc.description = string.format('%s (except for values: %s).', desc.description,
-                                table.concat(flex.TAGINFO_MAIN.delete_tags[k], ', '))
-        end
-        table.insert(tags, desc)
-    end
-
-    for k, _ in pairs(flex.TAGINFO_NAME_KEYS) do
-        local desc = get_key_description(k, 'Searchable name of the place.')
-        table.insert(tags, desc)
-    end
-    for k, _ in pairs(flex.TAGINFO_ADDRESS_KEYS) do
-        local desc = get_key_description(k, 'Used to determine the address of a place.')
-        table.insert(tags, desc)
-    end
-
-    local format = {
-        data_format = 1,
-        data_url = 'https://nominatim.openstreetmap.org/taginfo.json',
-        project = {
-            name = 'Nominatim',
-            description = 'OSM search engine.',
-            project_url = 'https://nominatim.openstreetmap.org',
-            doc_url = 'https://nominatim.org/release-docs/develop/',
-            contact_name = 'Sarah Hoffmann',
-            contact_email = 'lonvia@denofr.de'
-        }
-    }
-    format.tags = tags
-
-    set_keyorder(format, {'data_format', 'data_url', 'project', 'tags'})
-    set_keyorder(format.project, {'name', 'description', 'project_url', 'doc_url',
-                    'contact_name', 'contact_email'})
-
-    print(json.encode(format))
-end
-
-print_taginfo()
diff --git a/src/nominatim_api/connection.py b/src/nominatim_api/connection.py
index e104745e..04268dc3 100644
--- a/src/nominatim_api/connection.py
+++ b/src/nominatim_api/connection.py
@@ -18,6 +18,7 @@ from .typing import SaFromClause
 from .sql.sqlalchemy_schema import SearchTables
 from .sql.sqlalchemy_types import Geometry
 from .logging import log
+from .config import Configuration
 
 T = TypeVar('T')
 
@@ -31,9 +32,11 @@ class SearchConnection:
 
     def __init__(self, conn: AsyncConnection,
                  tables: SearchTables,
-                 properties: Dict[str, Any]) -> None:
+                 properties: Dict[str, Any],
+                 config: Configuration) -> None:
         self.connection = conn
         self.t = tables
+        self.config = config
         self._property_cache = properties
         self._classtables: Optional[Set[str]] = None
         self.query_timeout: Optional[int] = None
diff --git a/src/nominatim_api/core.py b/src/nominatim_api/core.py
index 3cf9e989..f8941bcc 100644
--- a/src/nominatim_api/core.py
+++ b/src/nominatim_api/core.py
@@ -26,7 +26,7 @@ from .connection import SearchConnection
 from .status import get_status, StatusResult
 from .lookup import get_places, get_detailed_place
 from .reverse import ReverseGeocoder
-from .search import ForwardGeocoder, Phrase, PhraseType, make_query_analyzer
+from . import search as nsearch
 from . import types as ntyp
 from .results import DetailedResult, ReverseResult, SearchResults
 
@@ -184,7 +184,7 @@ class NominatimAPIAsync:
         assert self._tables is not None
 
         async with self._engine.begin() as conn:
-            yield SearchConnection(conn, self._tables, self._property_cache)
+            yield SearchConnection(conn, self._tables, self._property_cache, self.config)
 
     async def status(self) -> StatusResult:
         """ Return the status of the database.
@@ -207,7 +207,7 @@ class NominatimAPIAsync:
         async with self.begin() as conn:
             conn.set_query_timeout(self.query_timeout)
             if details.keywords:
-                await make_query_analyzer(conn)
+                await nsearch.make_query_analyzer(conn)
             return await get_detailed_place(conn, place, details)
 
     async def lookup(self, places: Sequence[ntyp.PlaceRef], **params: Any) -> SearchResults:
@@ -219,7 +219,7 @@ class NominatimAPIAsync:
         async with self.begin() as conn:
             conn.set_query_timeout(self.query_timeout)
             if details.keywords:
-                await make_query_analyzer(conn)
+                await nsearch.make_query_analyzer(conn)
             return await get_places(conn, places, details)
 
     async def reverse(self, coord: ntyp.AnyPoint, **params: Any) -> Optional[ReverseResult]:
@@ -237,7 +237,7 @@ class NominatimAPIAsync:
         async with self.begin() as conn:
             conn.set_query_timeout(self.query_timeout)
             if details.keywords:
-                await make_query_analyzer(conn)
+                await nsearch.make_query_analyzer(conn)
             geocoder = ReverseGeocoder(conn, details,
                                        self.reverse_restrict_to_country_area)
             return await geocoder.lookup(coord)
@@ -251,10 +251,10 @@ class NominatimAPIAsync:
 
         async with self.begin() as conn:
             conn.set_query_timeout(self.query_timeout)
-            geocoder = ForwardGeocoder(conn, ntyp.SearchDetails.from_kwargs(params),
-                                       self.config.get_int('REQUEST_TIMEOUT')
-                                       if self.config.REQUEST_TIMEOUT else None)
-            phrases = [Phrase(PhraseType.NONE, p.strip()) for p in query.split(',')]
+            geocoder = nsearch.ForwardGeocoder(conn, ntyp.SearchDetails.from_kwargs(params),
+                                               self.config.get_int('REQUEST_TIMEOUT')
+                                               if self.config.REQUEST_TIMEOUT else None)
+            phrases = [nsearch.Phrase(nsearch.PHRASE_ANY, p.strip()) for p in query.split(',')]
             return await geocoder.lookup(phrases)
 
     async def search_address(self, amenity: Optional[str] = None,
@@ -271,22 +271,22 @@ class NominatimAPIAsync:
             conn.set_query_timeout(self.query_timeout)
             details = ntyp.SearchDetails.from_kwargs(params)
 
-            phrases: List[Phrase] = []
+            phrases: List[nsearch.Phrase] = []
 
             if amenity:
-                phrases.append(Phrase(PhraseType.AMENITY, amenity))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_AMENITY, amenity))
             if street:
-                phrases.append(Phrase(PhraseType.STREET, street))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_STREET, street))
             if city:
-                phrases.append(Phrase(PhraseType.CITY, city))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_CITY, city))
             if county:
-                phrases.append(Phrase(PhraseType.COUNTY, county))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_COUNTY, county))
             if state:
-                phrases.append(Phrase(PhraseType.STATE, state))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_STATE, state))
             if postalcode:
-                phrases.append(Phrase(PhraseType.POSTCODE, postalcode))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_POSTCODE, postalcode))
             if country:
-                phrases.append(Phrase(PhraseType.COUNTRY, country))
+                phrases.append(nsearch.Phrase(nsearch.PHRASE_COUNTRY, country))
 
             if not phrases:
                 raise UsageError('Nothing to search for.')
@@ -304,14 +304,14 @@ class NominatimAPIAsync:
             else:
                 details.restrict_min_max_rank(4, 4)
 
-            if 'layers' not in params:
+            if details.layers is None:
                 details.layers = ntyp.DataLayer.ADDRESS
                 if amenity:
                     details.layers |= ntyp.DataLayer.POI
 
-            geocoder = ForwardGeocoder(conn, details,
-                                       self.config.get_int('REQUEST_TIMEOUT')
-                                       if self.config.REQUEST_TIMEOUT else None)
+            geocoder = nsearch.ForwardGeocoder(conn, details,
+                                               self.config.get_int('REQUEST_TIMEOUT')
+                                               if self.config.REQUEST_TIMEOUT else None)
             return await geocoder.lookup(phrases)
 
     async def search_category(self, categories: List[Tuple[str, str]],
@@ -328,15 +328,15 @@ class NominatimAPIAsync:
         async with self.begin() as conn:
             conn.set_query_timeout(self.query_timeout)
             if near_query:
-                phrases = [Phrase(PhraseType.NONE, p) for p in near_query.split(',')]
+                phrases = [nsearch.Phrase(nsearch.PHRASE_ANY, p) for p in near_query.split(',')]
             else:
                 phrases = []
                 if details.keywords:
-                    await make_query_analyzer(conn)
+                    await nsearch.make_query_analyzer(conn)
 
-            geocoder = ForwardGeocoder(conn, details,
-                                       self.config.get_int('REQUEST_TIMEOUT')
-                                       if self.config.REQUEST_TIMEOUT else None)
+            geocoder = nsearch.ForwardGeocoder(conn, details,
+                                               self.config.get_int('REQUEST_TIMEOUT')
+                                               if self.config.REQUEST_TIMEOUT else None)
             return await geocoder.lookup_pois(categories, phrases)
 
 
diff --git a/src/nominatim_api/localization.py b/src/nominatim_api/localization.py
index bbf9225b..3414286e 100644
--- a/src/nominatim_api/localization.py
+++ b/src/nominatim_api/localization.py
@@ -8,6 +8,7 @@
 Helper functions for localizing names of results.
 """
 from typing import Mapping, List, Optional
+from .config import Configuration
 
 import re
 
@@ -20,14 +21,18 @@ class Locales:
     """
 
     def __init__(self, langs: Optional[List[str]] = None):
+        self.config = Configuration(None)
         self.languages = langs or []
         self.name_tags: List[str] = []
 
-        # Build the list of supported tags. It is currently hard-coded.
-        self._add_lang_tags('name')
-        self._add_tags('name', 'brand')
-        self._add_lang_tags('official_name', 'short_name')
-        self._add_tags('official_name', 'short_name', 'ref')
+        parts = self.config.OUTPUT_NAMES.split(',')
+
+        for part in parts:
+            part = part.strip()
+            if part.endswith(":XX"):
+                self._add_lang_tags(part[:-3])
+            else:
+                self._add_tags(part)
 
     def __bool__(self) -> bool:
         return len(self.languages) > 0
diff --git a/src/nominatim_api/logging.py b/src/nominatim_api/logging.py
index 1a6aef9b..64d43fdc 100644
--- a/src/nominatim_api/logging.py
+++ b/src/nominatim_api/logging.py
@@ -342,7 +342,8 @@ HTML_HEADER: str = """<!DOCTYPE html>
   <title>Nominatim - Debug</title>
   <style>
 """ + \
-    (HtmlFormatter(nobackground=True).get_style_defs('.highlight') if CODE_HIGHLIGHT else '') + \
+    (HtmlFormatter(nobackground=True).get_style_defs('.highlight')  # type: ignore[no-untyped-call]
+     if CODE_HIGHLIGHT else '') + \
     """
     h2 { font-size: x-large }
 
diff --git a/src/nominatim_api/query_preprocessing/__init__.py b/src/nominatim_api/query_preprocessing/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/src/nominatim_api/query_preprocessing/base.py b/src/nominatim_api/query_preprocessing/base.py
new file mode 100644
index 00000000..1e0afd05
--- /dev/null
+++ b/src/nominatim_api/query_preprocessing/base.py
@@ -0,0 +1,32 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2024 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Common data types and protocols for preprocessing.
+"""
+from typing import List, Callable
+
+from ..typing import Protocol
+from ..search import query as qmod
+from .config import QueryConfig
+
+QueryProcessingFunc = Callable[[List[qmod.Phrase]], List[qmod.Phrase]]
+
+
+class QueryHandler(Protocol):
+    """ Protocol for query modules.
+    """
+    def create(self, config: QueryConfig) -> QueryProcessingFunc:
+        """
+        Create a function for preprocessing the phrases of a query.
+        Arguments:
+            config: A dictionary with the additional configuration options
+                    specified in the tokenizer configuration
+            normalizer: An instance to transliterate text
+        Return:
+            A function returning the phrase list as modified by the preprocessor.
+        """
+        pass
diff --git a/src/nominatim_api/query_preprocessing/config.py b/src/nominatim_api/query_preprocessing/config.py
new file mode 100644
index 00000000..1948945c
--- /dev/null
+++ b/src/nominatim_api/query_preprocessing/config.py
@@ -0,0 +1,34 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2024 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Configuration for query preprocessors.
+"""
+from typing import Any, TYPE_CHECKING
+from collections import UserDict
+
+# working around missing generics in Python < 3.8
+# See https://github.com/python/typing/issues/60#issuecomment-869757075
+if TYPE_CHECKING:
+    _BaseUserDict = UserDict[str, Any]
+else:
+    _BaseUserDict = UserDict
+
+
+class QueryConfig(_BaseUserDict):
+    """ The `QueryConfig` class is a read-only dictionary
+        with configuration options for the preprocessor.
+        In addition to the usual dictionary functions, the class provides
+        accessors to standard preprocessor options that are used by many of the
+        preprocessors.
+    """
+
+    def set_normalizer(self, normalizer: Any) -> 'QueryConfig':
+        """ Set the normalizer function to be used.
+        """
+        self['_normalizer'] = normalizer
+
+        return self
diff --git a/src/nominatim_api/query_preprocessing/normalize.py b/src/nominatim_api/query_preprocessing/normalize.py
new file mode 100644
index 00000000..0bb0c8ed
--- /dev/null
+++ b/src/nominatim_api/query_preprocessing/normalize.py
@@ -0,0 +1,31 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2024 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Normalize query text using the same ICU normalization rules that are
+applied during import. If a phrase becomes empty because the normalization
+removes all terms, then the phrase is deleted.
+
+This preprocessor does not come with any extra information. Instead it will
+use the configuration from the `normalization` section.
+"""
+from typing import cast
+
+from .config import QueryConfig
+from .base import QueryProcessingFunc
+from ..search.query import Phrase
+
+
+def create(config: QueryConfig) -> QueryProcessingFunc:
+    normalizer = config.get('_normalizer')
+
+    if not normalizer:
+        return lambda p: p
+
+    return lambda phrases: list(
+        filter(lambda p: p.text,
+               (Phrase(p.ptype, cast(str, normalizer.transliterate(p.text)).strip('-: '))
+                for p in phrases)))
diff --git a/src/nominatim_api/query_preprocessing/regex_replace.py b/src/nominatim_api/query_preprocessing/regex_replace.py
new file mode 100644
index 00000000..b3a02495
--- /dev/null
+++ b/src/nominatim_api/query_preprocessing/regex_replace.py
@@ -0,0 +1,52 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+This preprocessor replaces values in a given input based on pre-defined regex rules.
+
+Arguments:
+    pattern: Regex pattern to be applied on the input
+    replace: The string that it is to be replaced with
+"""
+from typing import List
+import re
+
+from .config import QueryConfig
+from .base import QueryProcessingFunc
+from ..search.query import Phrase
+
+
+class _GenericPreprocessing:
+    """Perform replacements to input phrases using custom regex patterns."""
+
+    def __init__(self, config: QueryConfig) -> None:
+        """Initialise the _GenericPreprocessing class with patterns from the ICU config file."""
+        self.config = config
+
+        match_patterns = self.config.get('replacements', 'Key not found')
+        self.compiled_patterns = [
+            (re.compile(item['pattern']), item['replace']) for item in match_patterns
+            ]
+
+    def split_phrase(self, phrase: Phrase) -> Phrase:
+        """This function performs replacements on the given text using regex patterns."""
+        for item in self.compiled_patterns:
+            phrase.text = item[0].sub(item[1], phrase.text)
+
+        return phrase
+
+    def __call__(self, phrases: List[Phrase]) -> List[Phrase]:
+        """
+        Return the final Phrase list.
+        Returns an empty list if there is nothing left after split_phrase.
+        """
+        result = [p for p in map(self.split_phrase, phrases) if p.text.strip()]
+        return result
+
+
+def create(config: QueryConfig) -> QueryProcessingFunc:
+    """ Create a function for generic preprocessing."""
+    return _GenericPreprocessing(config)
diff --git a/src/nominatim_api/query_preprocessing/split_japanese_phrases.py b/src/nominatim_api/query_preprocessing/split_japanese_phrases.py
new file mode 100644
index 00000000..7ab55b5f
--- /dev/null
+++ b/src/nominatim_api/query_preprocessing/split_japanese_phrases.py
@@ -0,0 +1,61 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+This file divides Japanese addresses into three categories:
+prefecture, municipality, and other.
+The division is not strict; it is a simple split on the keywords below.
+"""
+from typing import List
+import re
+
+from .config import QueryConfig
+from .base import QueryProcessingFunc
+from ..search.query import Phrase
+
+MATCH_PATTERNS = [
+    r'''
+                (...??[都都道府県縣])            # [group1] prefecture
+                (.+?[市区區町村])              # [group2] municipalities (city/wards/towns/villages)
+                (.+)                         # [group3] other words
+                ''',
+    r'''
+                (...??[都都道府県縣])            # [group1] prefecture
+                (.+)                         # [group3] other words
+                ''',
+    r'''
+                (.+?[市区區町村])              # [group2] municipalities (city/wards/towns/villages)
+                (.+)                         # [group3] other words
+                '''
+]
+
+
+class _JapanesePreprocessing:
+
+    def __init__(self, config: QueryConfig) -> None:
+        self.config = config
+
+    def split_phrase(self, phrase: Phrase) -> Phrase:
+        """
+        This function performs a division on the given text using a regular expression.
+        """
+        for pattern in MATCH_PATTERNS:
+            result = re.match(pattern, phrase.text, re.VERBOSE)
+            if result is not None:
+                return Phrase(phrase.ptype, ':'.join(result.groups()))
+
+        return phrase
+
+    def __call__(self, phrases: List[Phrase]) -> List[Phrase]:
+        """Split the Japanese addresses in the given phrases using the regex patterns.
+        """
+        return [self.split_phrase(p) for p in phrases]
+
+
+def create(config: QueryConfig) -> QueryProcessingFunc:
+    """ Create a function for Japanese preprocessing.
+    """
+    return _JapanesePreprocessing(config)
diff --git a/src/nominatim_api/reverse.py b/src/nominatim_api/reverse.py
index 1b06e659..c9f11b63 100644
--- a/src/nominatim_api/reverse.py
+++ b/src/nominatim_api/reverse.py
@@ -362,6 +362,8 @@ class ReverseGeocoder:
             # later only a minimum of results needs to be checked with ST_Contains.
             inner = sa.select(t, sa.literal(0.0).label('distance'))\
                       .where(t.c.rank_search.between(5, MAX_RANK_PARAM))\
+                      .where(t.c.rank_address != 5)\
+                      .where(t.c.rank_address != 11)\
                       .where(t.c.geometry.intersects(WKT_PARAM))\
                       .where(sa.func.PlacexGeometryReverseLookuppolygon())\
                       .order_by(sa.desc(t.c.rank_search))\
@@ -478,14 +480,15 @@ class ReverseGeocoder:
         log().var_dump('Country codes', ccodes)
         return ccodes
 
-    async def lookup_country(self, ccodes: List[str]) -> Optional[SaRow]:
+    async def lookup_country(self, ccodes: List[str]) -> Tuple[Optional[SaRow], RowFunc]:
         """ Lookup the country for the current search.
         """
+        row_func = nres.create_from_placex_row
         if not ccodes:
             ccodes = await self.lookup_country_codes()
 
         if not ccodes:
-            return None
+            return None, row_func
 
         t = self.conn.t.placex
         if self.max_rank > 4:
@@ -537,7 +540,32 @@ class ReverseGeocoder:
 
             address_row = (await self.conn.execute(sql, self.bind_params)).one_or_none()
 
-        return address_row
+        if address_row is None:
+            # finally fall back to country table
+            t = self.conn.t.country_name
+            tgrid = self.conn.t.country_grid
+
+            sql = sa.select(tgrid.c.country_code,
+                            tgrid.c.geometry.ST_Centroid().ST_Collect().ST_Centroid()
+                                 .label('centroid'),
+                            tgrid.c.geometry.ST_Collect().ST_Expand(0).label('bbox'))\
+                    .where(tgrid.c.country_code.in_(ccodes))\
+                    .group_by(tgrid.c.country_code)
+
+            sub = sql.subquery('grid')
+            sql = sa.select(t.c.country_code,
+                            t.c.name.merge(t.c.derived_name).label('name'),
+                            sub.c.centroid, sub.c.bbox)\
+                    .join(sub, t.c.country_code == sub.c.country_code)\
+                    .order_by(t.c.country_code)\
+                    .limit(1)
+
+            sql = self._add_geometry_columns(sql, sub.c.centroid)
+
+            address_row = (await self.conn.execute(sql, self.bind_params)).one_or_none()
+            row_func = nres.create_from_country_row
+
+        return address_row, row_func
 
     async def lookup(self, coord: AnyPoint) -> Optional[nres.ReverseResult]:
         """ Look up a single coordinate. Returns the place information,
@@ -566,12 +594,12 @@ class ReverseGeocoder:
             if self.max_rank > 4:
                 row = await self.lookup_area()
             if row is None and self.layer_enabled(DataLayer.ADDRESS):
-                row = await self.lookup_country(ccodes)
+                row, row_func = await self.lookup_country(ccodes)
 
         result = row_func(row, nres.ReverseResult)
         if result is not None:
             assert row is not None
-            result.distance = row.distance
+            result.distance = getattr(row,  'distance', 0)
             if hasattr(row, 'bbox'):
                 result.bbox = Bbox.from_wkb(row.bbox)
             await nres.add_result_details(self.conn, [result], self.params)
diff --git a/src/nominatim_api/search/__init__.py b/src/nominatim_api/search/__init__.py
index 956d91d8..c7312e23 100644
--- a/src/nominatim_api/search/__init__.py
+++ b/src/nominatim_api/search/__init__.py
@@ -9,5 +9,12 @@ Module for forward search.
 """
 from .geocoder import (ForwardGeocoder as ForwardGeocoder)
 from .query import (Phrase as Phrase,
-                    PhraseType as PhraseType)
+                    PHRASE_ANY as PHRASE_ANY,
+                    PHRASE_AMENITY as PHRASE_AMENITY,
+                    PHRASE_STREET as PHRASE_STREET,
+                    PHRASE_CITY as PHRASE_CITY,
+                    PHRASE_COUNTY as PHRASE_COUNTY,
+                    PHRASE_STATE as PHRASE_STATE,
+                    PHRASE_POSTCODE as PHRASE_POSTCODE,
+                    PHRASE_COUNTRY as PHRASE_COUNTRY)
 from .query_analyzer_factory import (make_query_analyzer as make_query_analyzer)
diff --git a/src/nominatim_api/search/db_search_builder.py b/src/nominatim_api/search/db_search_builder.py
index 1fbb7168..de85cefa 100644
--- a/src/nominatim_api/search/db_search_builder.py
+++ b/src/nominatim_api/search/db_search_builder.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Conversion from token assignment to an abstract DB search.
@@ -11,7 +11,7 @@ from typing import Optional, List, Tuple, Iterator, Dict
 import heapq
 
 from ..types import SearchDetails, DataLayer
-from .query import QueryStruct, Token, TokenType, TokenRange, BreakType
+from . import query as qmod
 from .token_assignment import TokenAssignment
 from . import db_search_fields as dbf
 from . import db_searches as dbs
@@ -51,7 +51,7 @@ class SearchBuilder:
     """ Build the abstract search queries from token assignments.
     """
 
-    def __init__(self, query: QueryStruct, details: SearchDetails) -> None:
+    def __init__(self, query: qmod.QueryStruct, details: SearchDetails) -> None:
         self.query = query
         self.details = details
 
@@ -97,7 +97,7 @@ class SearchBuilder:
                 builder = self.build_poi_search(sdata)
             elif assignment.housenumber:
                 hnr_tokens = self.query.get_tokens(assignment.housenumber,
-                                                   TokenType.HOUSENUMBER)
+                                                   qmod.TOKEN_HOUSENUMBER)
                 builder = self.build_housenumber_search(sdata, hnr_tokens, assignment.address)
             else:
                 builder = self.build_special_search(sdata, assignment.address,
@@ -128,7 +128,7 @@ class SearchBuilder:
             yield dbs.PoiSearch(sdata)
 
     def build_special_search(self, sdata: dbf.SearchData,
-                             address: List[TokenRange],
+                             address: List[qmod.TokenRange],
                              is_category: bool) -> Iterator[dbs.AbstractSearch]:
         """ Build abstract search queries for searches that do not involve
             a named place.
@@ -146,13 +146,12 @@ class SearchBuilder:
             if address:
                 sdata.lookups = [dbf.FieldLookup('nameaddress_vector',
                                                  [t.token for r in address
-                                                  for t in self.query.get_partials_list(r)],
+                                                  for t in self.query.iter_partials(r)],
                                                  lookups.Restrict)]
-                penalty += 0.2
             yield dbs.PostcodeSearch(penalty, sdata)
 
-    def build_housenumber_search(self, sdata: dbf.SearchData, hnrs: List[Token],
-                                 address: List[TokenRange]) -> Iterator[dbs.AbstractSearch]:
+    def build_housenumber_search(self, sdata: dbf.SearchData, hnrs: List[qmod.Token],
+                                 address: List[qmod.TokenRange]) -> Iterator[dbs.AbstractSearch]:
         """ Build a simple address search for special entries where the
             housenumber is the main name token.
         """
@@ -160,7 +159,7 @@ class SearchBuilder:
         expected_count = sum(t.count for t in hnrs)
 
         partials = {t.token: t.addr_count for trange in address
-                    for t in self.query.get_partials_list(trange)}
+                    for t in self.query.iter_partials(trange)}
 
         if not partials:
             # can happen when none of the partials is indexed
@@ -174,7 +173,7 @@ class SearchBuilder:
                                                  list(partials), lookups.LookupAll))
         else:
             addr_fulls = [t.token for t
-                          in self.query.get_tokens(address[0], TokenType.WORD)]
+                          in self.query.get_tokens(address[0], qmod.TOKEN_WORD)]
             if len(addr_fulls) > 5:
                 return
             sdata.lookups.append(
@@ -184,7 +183,7 @@ class SearchBuilder:
         yield dbs.PlaceSearch(0.05, sdata, expected_count)
 
     def build_name_search(self, sdata: dbf.SearchData,
-                          name: TokenRange, address: List[TokenRange],
+                          name: qmod.TokenRange, address: List[qmod.TokenRange],
                           is_category: bool) -> Iterator[dbs.AbstractSearch]:
         """ Build abstract search queries for simple name or address searches.
         """
@@ -197,19 +196,19 @@ class SearchBuilder:
                 sdata.lookups = lookup
                 yield dbs.PlaceSearch(penalty + name_penalty, sdata, count)
 
-    def yield_lookups(self, name: TokenRange, address: List[TokenRange]
+    def yield_lookups(self, name: qmod.TokenRange, address: List[qmod.TokenRange]
                       ) -> Iterator[Tuple[float, int, List[dbf.FieldLookup]]]:
         """ Yield all variants how the given name and address should best
             be searched for. This takes into account how frequent the terms
             are and tries to find a lookup that optimizes index use.
         """
         penalty = 0.0  # extra penalty
-        name_partials = {t.token: t for t in self.query.get_partials_list(name)}
+        name_partials = {t.token: t for t in self.query.iter_partials(name)}
 
-        addr_partials = [t for r in address for t in self.query.get_partials_list(r)]
+        addr_partials = [t for r in address for t in self.query.iter_partials(r)]
         addr_tokens = list({t.token for t in addr_partials})
 
-        exp_count = min(t.count for t in name_partials.values()) / (2**(len(name_partials) - 1))
+        exp_count = min(t.count for t in name_partials.values()) / (3**(len(name_partials) - 1))
 
         if (len(name_partials) > 3 or exp_count < 8000):
             yield penalty, exp_count, dbf.lookup_by_names(list(name_partials.keys()), addr_tokens)
@@ -217,7 +216,7 @@ class SearchBuilder:
 
         addr_count = min(t.addr_count for t in addr_partials) if addr_partials else 50000
         # Partial term to frequent. Try looking up by rare full names first.
-        name_fulls = self.query.get_tokens(name, TokenType.WORD)
+        name_fulls = self.query.get_tokens(name, qmod.TOKEN_WORD)
         if name_fulls:
             fulls_count = sum(t.count for t in name_fulls)
 
@@ -228,7 +227,7 @@ class SearchBuilder:
 
         # To catch remaining results, lookup by name and address
         # We only do this if there is a reasonable number of results expected.
-        exp_count = exp_count / (2**len(addr_tokens)) if addr_tokens else exp_count
+        exp_count /= 2**len(addr_tokens)
         if exp_count < 10000 and addr_count < 20000:
             penalty += 0.35 * max(1 if name_fulls else 0.1,
                                   5 - len(name_partials) - len(addr_tokens))
@@ -236,7 +235,7 @@ class SearchBuilder:
                 self.get_name_address_ranking(list(name_partials.keys()), addr_partials)
 
     def get_name_address_ranking(self, name_tokens: List[int],
-                                 addr_partials: List[Token]) -> List[dbf.FieldLookup]:
+                                 addr_partials: List[qmod.Token]) -> List[dbf.FieldLookup]:
         """ Create a ranking expression looking up by name and address.
         """
         lookup = [dbf.FieldLookup('name_vector', name_tokens, lookups.LookupAll)]
@@ -258,15 +257,13 @@ class SearchBuilder:
 
         return lookup
 
-    def get_full_name_ranking(self, name_fulls: List[Token], addr_partials: List[Token],
+    def get_full_name_ranking(self, name_fulls: List[qmod.Token], addr_partials: List[qmod.Token],
                               use_lookup: bool) -> List[dbf.FieldLookup]:
         """ Create a ranking expression with full name terms and
             additional address lookup. When 'use_lookup' is true, then
             address lookups will use the index, when the occurrences are not
             too many.
         """
-        # At this point drop unindexed partials from the address.
-        # This might yield wrong results, nothing we can do about that.
         if use_lookup:
             addr_restrict_tokens = []
             addr_lookup_tokens = [t.token for t in addr_partials]
@@ -277,19 +274,18 @@ class SearchBuilder:
         return dbf.lookup_by_any_name([t.token for t in name_fulls],
                                       addr_restrict_tokens, addr_lookup_tokens)
 
-    def get_name_ranking(self, trange: TokenRange,
+    def get_name_ranking(self, trange: qmod.TokenRange,
                          db_field: str = 'name_vector') -> dbf.FieldRanking:
         """ Create a ranking expression for a name term in the given range.
         """
-        name_fulls = self.query.get_tokens(trange, TokenType.WORD)
+        name_fulls = self.query.get_tokens(trange, qmod.TOKEN_WORD)
         ranks = [dbf.RankedTokens(t.penalty, [t.token]) for t in name_fulls]
         ranks.sort(key=lambda r: r.penalty)
         # Fallback, sum of penalty for partials
-        name_partials = self.query.get_partials_list(trange)
-        default = sum(t.penalty for t in name_partials) + 0.2
+        default = sum(t.penalty for t in self.query.iter_partials(trange)) + 0.2
         return dbf.FieldRanking(db_field, default, ranks)
 
-    def get_addr_ranking(self, trange: TokenRange) -> dbf.FieldRanking:
+    def get_addr_ranking(self, trange: qmod.TokenRange) -> dbf.FieldRanking:
         """ Create a list of ranking expressions for an address term
             for the given ranges.
         """
@@ -299,35 +295,35 @@ class SearchBuilder:
 
         while todo:
             neglen, pos, rank = heapq.heappop(todo)
+            # partial node
+            partial = self.query.nodes[pos].partial
+            if partial is not None:
+                if pos + 1 < trange.end:
+                    penalty = rank.penalty + partial.penalty \
+                              + PENALTY_WORDCHANGE[self.query.nodes[pos + 1].btype]
+                    heapq.heappush(todo, (neglen - 1, pos + 1,
+                                   dbf.RankedTokens(penalty, rank.tokens)))
+                else:
+                    ranks.append(dbf.RankedTokens(rank.penalty + partial.penalty,
+                                                  rank.tokens))
+            # full words
             for tlist in self.query.nodes[pos].starting:
-                if tlist.ttype in (TokenType.PARTIAL, TokenType.WORD):
+                if tlist.ttype == qmod.TOKEN_WORD:
                     if tlist.end < trange.end:
                         chgpenalty = PENALTY_WORDCHANGE[self.query.nodes[tlist.end].btype]
-                        if tlist.ttype == TokenType.PARTIAL:
-                            penalty = rank.penalty + chgpenalty \
-                                      + max(t.penalty for t in tlist.tokens)
+                        for t in tlist.tokens:
                             heapq.heappush(todo, (neglen - 1, tlist.end,
-                                                  dbf.RankedTokens(penalty, rank.tokens)))
-                        else:
-                            for t in tlist.tokens:
-                                heapq.heappush(todo, (neglen - 1, tlist.end,
-                                                      rank.with_token(t, chgpenalty)))
+                                                  rank.with_token(t, chgpenalty)))
                     elif tlist.end == trange.end:
-                        if tlist.ttype == TokenType.PARTIAL:
-                            ranks.append(dbf.RankedTokens(rank.penalty
-                                                          + max(t.penalty for t in tlist.tokens),
-                                                          rank.tokens))
-                        else:
-                            ranks.extend(rank.with_token(t, 0.0) for t in tlist.tokens)
-                        if len(ranks) >= 10:
-                            # Too many variants, bail out and only add
-                            # Worst-case Fallback: sum of penalty of partials
-                            name_partials = self.query.get_partials_list(trange)
-                            default = sum(t.penalty for t in name_partials) + 0.2
-                            ranks.append(dbf.RankedTokens(rank.penalty + default, []))
-                            # Bail out of outer loop
-                            todo.clear()
-                            break
+                        ranks.extend(rank.with_token(t, 0.0) for t in tlist.tokens)
+
+            if len(ranks) >= 10:
+                # Too many variants, bail out and only add
+                # Worst-case Fallback: sum of penalty of partials
+                default = sum(t.penalty for t in self.query.iter_partials(trange)) + 0.2
+                ranks.append(dbf.RankedTokens(rank.penalty + default, []))
+                # Bail out of outer loop
+                break
 
         ranks.sort(key=lambda r: len(r.tokens))
         default = ranks[0].penalty + 0.3
@@ -353,11 +349,11 @@ class SearchBuilder:
         if assignment.housenumber:
             sdata.set_strings('housenumbers',
                               self.query.get_tokens(assignment.housenumber,
-                                                    TokenType.HOUSENUMBER))
+                                                    qmod.TOKEN_HOUSENUMBER))
         if assignment.postcode:
             sdata.set_strings('postcodes',
                               self.query.get_tokens(assignment.postcode,
-                                                    TokenType.POSTCODE))
+                                                    qmod.TOKEN_POSTCODE))
         if assignment.qualifier:
             tokens = self.get_qualifier_tokens(assignment.qualifier)
             if not tokens:
@@ -382,23 +378,23 @@ class SearchBuilder:
 
         return sdata
 
-    def get_country_tokens(self, trange: TokenRange) -> List[Token]:
+    def get_country_tokens(self, trange: qmod.TokenRange) -> List[qmod.Token]:
         """ Return the list of country tokens for the given range,
             optionally filtered by the country list from the details
             parameters.
         """
-        tokens = self.query.get_tokens(trange, TokenType.COUNTRY)
+        tokens = self.query.get_tokens(trange, qmod.TOKEN_COUNTRY)
         if self.details.countries:
             tokens = [t for t in tokens if t.lookup_word in self.details.countries]
 
         return tokens
 
-    def get_qualifier_tokens(self, trange: TokenRange) -> List[Token]:
+    def get_qualifier_tokens(self, trange: qmod.TokenRange) -> List[qmod.Token]:
         """ Return the list of qualifier tokens for the given range,
             optionally filtered by the qualifier list from the details
             parameters.
         """
-        tokens = self.query.get_tokens(trange, TokenType.QUALIFIER)
+        tokens = self.query.get_tokens(trange, qmod.TOKEN_QUALIFIER)
         if self.details.categories:
             tokens = [t for t in tokens if t.get_category() in self.details.categories]
 
@@ -411,7 +407,7 @@ class SearchBuilder:
         """
         if assignment.near_item:
             tokens: Dict[Tuple[str, str], float] = {}
-            for t in self.query.get_tokens(assignment.near_item, TokenType.NEAR_ITEM):
+            for t in self.query.get_tokens(assignment.near_item, qmod.TOKEN_NEAR_ITEM):
                 cat = t.get_category()
                 # The category of a near search will be that of near_item.
                 # Thus, if search is restricted to a category parameter,
@@ -425,10 +421,11 @@ class SearchBuilder:
 
 
 PENALTY_WORDCHANGE = {
-    BreakType.START: 0.0,
-    BreakType.END: 0.0,
-    BreakType.PHRASE: 0.0,
-    BreakType.WORD: 0.1,
-    BreakType.PART: 0.2,
-    BreakType.TOKEN: 0.4
+    qmod.BREAK_START: 0.0,
+    qmod.BREAK_END: 0.0,
+    qmod.BREAK_PHRASE: 0.0,
+    qmod.BREAK_SOFT_PHRASE: 0.0,
+    qmod.BREAK_WORD: 0.1,
+    qmod.BREAK_PART: 0.2,
+    qmod.BREAK_TOKEN: 0.4
 }
diff --git a/src/nominatim_api/search/db_searches.py b/src/nominatim_api/search/db_searches.py
index 3a4c826f..8e37c748 100644
--- a/src/nominatim_api/search/db_searches.py
+++ b/src/nominatim_api/search/db_searches.py
@@ -581,9 +581,13 @@ class PostcodeSearch(AbstractSearch):
                      .where((tsearch.c.name_vector + tsearch.c.nameaddress_vector)
                             .contains(sa.type_coerce(self.lookups[0].tokens,
                                                      IntArray)))
+            # Do NOT add rerank penalties based on the address terms.
+            # The standard rerank penalty only checks the address vector
+            # while terms may appear in name and address vector. This would
+            # lead to overly high penalties.
+            # We assume that a postcode is precise enough to not require
+            # additional full name matches.
 
-        for ranking in self.rankings:
-            penalty += ranking.sql_penalty(conn.t.search_name)
         penalty += sa.case(*((t.c.postcode == v, p) for v, p in self.postcodes),
                            else_=1.0)
 
diff --git a/src/nominatim_api/search/geocoder.py b/src/nominatim_api/search/geocoder.py
index efe5b721..5fefe5ea 100644
--- a/src/nominatim_api/search/geocoder.py
+++ b/src/nominatim_api/search/geocoder.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Public interface to the search code.
@@ -50,6 +50,9 @@ class ForwardGeocoder:
             self.query_analyzer = await make_query_analyzer(self.conn)
 
         query = await self.query_analyzer.analyze_query(phrases)
+        query.compute_direction_penalty()
+        log().var_dump('Query direction penalty',
+                       lambda: f"[{'LR' if query.dir_penalty < 0 else 'RL'}] {query.dir_penalty}")
 
         searches: List[AbstractSearch] = []
         if query.num_token_slots() > 0:
@@ -133,7 +136,7 @@ class ForwardGeocoder:
         """
         assert self.query_analyzer is not None
         qwords = [word for phrase in query.source
-                  for word in re.split('[, ]+', phrase.text) if word]
+                  for word in re.split('[-,: ]+', phrase.text) if word]
         if not qwords:
             return
 
@@ -146,7 +149,7 @@ class ForwardGeocoder:
             distance = 0.0
             norm = self.query_analyzer.normalize_text(' '.join((result.display_name,
                                                                 result.country_code or '')))
-            words = set((w for w in norm.split(' ') if w))
+            words = set((w for w in re.split('[-,: ]+', norm) if w))
             if not words:
                 continue
             for qword in qwords:
@@ -238,7 +241,7 @@ def _dump_searches(searches: List[AbstractSearch], query: QueryStruct,
         if not lk:
             return ''
 
-        return f"{lk.lookup_type}({lk.column}{tk(lk.tokens)})"
+        return f"{lk.lookup_type.__name__}({lk.column}{tk(lk.tokens)})"
 
     def fmt_cstr(c: Any) -> str:
         if not c:
diff --git a/src/nominatim_api/search/icu_tokenizer.py b/src/nominatim_api/search/icu_tokenizer.py
index c18dd8be..1cb34f72 100644
--- a/src/nominatim_api/search/icu_tokenizer.py
+++ b/src/nominatim_api/search/icu_tokenizer.py
@@ -2,64 +2,50 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Implementation of query analysis for the ICU tokenizer.
 """
-from typing import Tuple, Dict, List, Optional, NamedTuple, Iterator, Any, cast
-from collections import defaultdict
+from typing import Tuple, Dict, List, Optional, Iterator, Any, cast
 import dataclasses
 import difflib
+import re
+from itertools import zip_longest
 
 from icu import Transliterator
 
 import sqlalchemy as sa
 
+from ..errors import UsageError
 from ..typing import SaRow
 from ..sql.sqlalchemy_types import Json
 from ..connection import SearchConnection
 from ..logging import log
-from ..search import query as qmod
-from ..search.query_analyzer_factory import AbstractQueryAnalyzer
+from . import query as qmod
+from ..query_preprocessing.config import QueryConfig
+from ..query_preprocessing.base import QueryProcessingFunc
+from .query_analyzer_factory import AbstractQueryAnalyzer
+from .postcode_parser import PostcodeParser
 
 
 DB_TO_TOKEN_TYPE = {
-    'W': qmod.TokenType.WORD,
-    'w': qmod.TokenType.PARTIAL,
-    'H': qmod.TokenType.HOUSENUMBER,
-    'P': qmod.TokenType.POSTCODE,
-    'C': qmod.TokenType.COUNTRY
+    'W': qmod.TOKEN_WORD,
+    'w': qmod.TOKEN_PARTIAL,
+    'H': qmod.TOKEN_HOUSENUMBER,
+    'P': qmod.TOKEN_POSTCODE,
+    'C': qmod.TOKEN_COUNTRY
 }
 
-
-class QueryPart(NamedTuple):
-    """ Normalized and transliterated form of a single term in the query.
-        When the term came out of a split during the transliteration,
-        the normalized string is the full word before transliteration.
-        The word number keeps track of the word before transliteration
-        and can be used to identify partial transliterated terms.
-    """
-    token: str
-    normalized: str
-    word_number: int
-
-
-QueryParts = List[QueryPart]
-WordDict = Dict[str, List[qmod.TokenRange]]
-
-
-def yield_words(terms: List[QueryPart], start: int) -> Iterator[Tuple[str, qmod.TokenRange]]:
-    """ Return all combinations of words in the terms list after the
-        given position.
-    """
-    total = len(terms)
-    for first in range(start, total):
-        word = terms[first].token
-        yield word, qmod.TokenRange(first, first + 1)
-        for last in range(first + 1, min(first + 20, total)):
-            word = ' '.join((word, terms[last].token))
-            yield word, qmod.TokenRange(first, last + 1)
+PENALTY_IN_TOKEN_BREAK = {
+     qmod.BREAK_START: 0.5,
+     qmod.BREAK_END: 0.5,
+     qmod.BREAK_PHRASE: 0.5,
+     qmod.BREAK_SOFT_PHRASE: 0.5,
+     qmod.BREAK_WORD: 0.1,
+     qmod.BREAK_PART: 0.0,
+     qmod.BREAK_TOKEN: 0.0
+}
 
 
 @dataclasses.dataclass
@@ -92,25 +78,25 @@ class ICUToken(qmod.Token):
         self.penalty += (distance/len(self.lookup_word))
 
     @staticmethod
-    def from_db_row(row: SaRow) -> 'ICUToken':
+    def from_db_row(row: SaRow, base_penalty: float = 0.0) -> 'ICUToken':
         """ Create a ICUToken from the row of the word table.
         """
         count = 1 if row.info is None else row.info.get('count', 1)
         addr_count = 1 if row.info is None else row.info.get('addr_count', 1)
 
-        penalty = 0.0
+        penalty = base_penalty
         if row.type == 'w':
-            penalty = 0.3
+            penalty += 0.3
         elif row.type == 'W':
             if len(row.word_token) == 1 and row.word_token == row.word:
-                penalty = 0.2 if row.word.isdigit() else 0.3
+                penalty += 0.2 if row.word.isdigit() else 0.3
         elif row.type == 'H':
-            penalty = sum(0.1 for c in row.word_token if c != ' ' and not c.isdigit())
+            penalty += sum(0.1 for c in row.word_token if c != ' ' and not c.isdigit())
             if all(not c.isdigit() for c in row.word_token):
                 penalty += 0.2 * (len(row.word_token) - 1)
         elif row.type == 'C':
             if len(row.word_token) == 1:
-                penalty = 0.3
+                penalty += 0.3
 
         if row.info is None:
             lookup_word = row.word
@@ -127,71 +113,99 @@ class ICUToken(qmod.Token):
                         addr_count=max(1, addr_count))
 
 
-class ICUQueryAnalyzer(AbstractQueryAnalyzer):
-    """ Converter for query strings into a tokenized query
-        using the tokens created by a ICU tokenizer.
-    """
-    def __init__(self, conn: SearchConnection) -> None:
-        self.conn = conn
+@dataclasses.dataclass
+class ICUAnalyzerConfig:
+    postcode_parser: PostcodeParser
+    normalizer: Transliterator
+    transliterator: Transliterator
+    preprocessors: List[QueryProcessingFunc]
 
-    async def setup(self) -> None:
-        """ Set up static data structures needed for the analysis.
-        """
-        async def _make_normalizer() -> Any:
-            rules = await self.conn.get_property('tokenizer_import_normalisation')
-            return Transliterator.createFromRules("normalization", rules)
+    @staticmethod
+    async def create(conn: SearchConnection) -> 'ICUAnalyzerConfig':
+        rules = await conn.get_property('tokenizer_import_normalisation')
+        normalizer = Transliterator.createFromRules("normalization", rules)
 
-        self.normalizer = await self.conn.get_cached_value('ICUTOK', 'normalizer',
-                                                           _make_normalizer)
+        rules = await conn.get_property('tokenizer_import_transliteration')
+        transliterator = Transliterator.createFromRules("transliteration", rules)
 
-        async def _make_transliterator() -> Any:
-            rules = await self.conn.get_property('tokenizer_import_transliteration')
-            return Transliterator.createFromRules("transliteration", rules)
+        preprocessing_rules = conn.config.load_sub_configuration('icu_tokenizer.yaml',
+                                                                 config='TOKENIZER_CONFIG')\
+                                         .get('query-preprocessing', [])
 
-        self.transliterator = await self.conn.get_cached_value('ICUTOK', 'transliterator',
-                                                               _make_transliterator)
+        preprocessors: List[QueryProcessingFunc] = []
+        for func in preprocessing_rules:
+            if 'step' not in func:
+                raise UsageError("Preprocessing rule is missing the 'step' attribute.")
+            if not isinstance(func['step'], str):
+                raise UsageError("'step' attribute must be a simple string.")
+
+            module = conn.config.load_plugin_module(
+                        func['step'], 'nominatim_api.query_preprocessing')
+            preprocessors.append(
+                module.create(QueryConfig(func).set_normalizer(normalizer)))
+
+        return ICUAnalyzerConfig(PostcodeParser(conn.config),
+                                 normalizer, transliterator, preprocessors)
 
-        if 'word' not in self.conn.t.meta.tables:
-            sa.Table('word', self.conn.t.meta,
-                     sa.Column('word_id', sa.Integer),
-                     sa.Column('word_token', sa.Text, nullable=False),
-                     sa.Column('type', sa.Text, nullable=False),
-                     sa.Column('word', sa.Text),
-                     sa.Column('info', Json))
+
+class ICUQueryAnalyzer(AbstractQueryAnalyzer):
+    """ Converter for query strings into a tokenized query
+        using the tokens created by an ICU tokenizer.
+    """
+    def __init__(self, conn: SearchConnection, config: ICUAnalyzerConfig) -> None:
+        self.conn = conn
+        self.postcode_parser = config.postcode_parser
+        self.normalizer = config.normalizer
+        self.transliterator = config.transliterator
+        self.preprocessors = config.preprocessors
 
     async def analyze_query(self, phrases: List[qmod.Phrase]) -> qmod.QueryStruct:
         """ Analyze the given list of phrases and return the
             tokenized query.
         """
         log().section('Analyze query (using ICU tokenizer)')
-        normalized = list(filter(lambda p: p.text,
-                                 (qmod.Phrase(p.ptype, self.normalize_text(p.text))
-                                  for p in phrases)))
-        query = qmod.QueryStruct(normalized)
+        for func in self.preprocessors:
+            phrases = func(phrases)
+
+        if len(phrases) == 1 \
+                and phrases[0].text.count(' ') > 3 \
+                and max(len(s) for s in phrases[0].text.split()) < 3:
+            phrases = []  # query of only very short words: drop all phrases
+
+        query = qmod.QueryStruct(phrases)
+
         log().var_dump('Normalized query', query.source)
         if not query.source:
             return query
 
-        parts, words = self.split_query(query)
-        log().var_dump('Transliterated query', lambda: _dump_transliterated(query, parts))
+        self.split_query(query)
+        log().var_dump('Transliterated query', lambda: query.get_transliterated_query())
+        words = query.extract_words(base_penalty=PENALTY_IN_TOKEN_BREAK[qmod.BREAK_WORD])
 
         for row in await self.lookup_in_db(list(words.keys())):
             for trange in words[row.word_token]:
-                token = ICUToken.from_db_row(row)
+                token = ICUToken.from_db_row(row, trange.penalty or 0.0)
                 if row.type == 'S':
                     if row.info['op'] in ('in', 'near'):
                         if trange.start == 0:
-                            query.add_token(trange, qmod.TokenType.NEAR_ITEM, token)
+                            query.add_token(trange, qmod.TOKEN_NEAR_ITEM, token)
                     else:
                         if trange.start == 0 and trange.end == query.num_token_slots():
-                            query.add_token(trange, qmod.TokenType.NEAR_ITEM, token)
+                            query.add_token(trange, qmod.TOKEN_NEAR_ITEM, token)
                         else:
-                            query.add_token(trange, qmod.TokenType.QUALIFIER, token)
+                            query.add_token(trange, qmod.TOKEN_QUALIFIER, token)
                 else:
                     query.add_token(trange, DB_TO_TOKEN_TYPE[row.type], token)
 
-        self.add_extra_tokens(query, parts)
-        self.rerank_tokens(query, parts)
+        self.add_extra_tokens(query)
+        for start, end, pc in self.postcode_parser.parse(query):
+            term = ' '.join(n.term_lookup for n in query.nodes[start + 1:end + 1])
+            query.add_token(qmod.TokenRange(start, end),
+                            qmod.TOKEN_POSTCODE,
+                            ICUToken(penalty=0.1, token=0, count=1, addr_count=1,
+                                     lookup_word=pc, word_token=term,
+                                     info=None))
+        self.rerank_tokens(query)
 
         log().table_dump('Word tokens', _dump_word_tokens(query))
 
@@ -202,102 +216,108 @@ class ICUQueryAnalyzer(AbstractQueryAnalyzer):
             standardized form search will work with. All information removed
             at this stage is inevitably lost.
         """
-        norm = cast(str, self.normalizer.transliterate(text))
-        numspaces = norm.count(' ')
-        if numspaces > 4 and len(norm) <= (numspaces + 1) * 3:
-            return ''
+        return cast(str, self.normalizer.transliterate(text)).strip('-: ')
 
-        return norm
-
-    def split_query(self, query: qmod.QueryStruct) -> Tuple[QueryParts, WordDict]:
+    def split_query(self, query: qmod.QueryStruct) -> None:
         """ Transliterate the phrases and split them into tokens.
-
-            Returns the list of transliterated tokens together with their
-            normalized form and a dictionary of words for lookup together
-            with their position.
         """
-        parts: QueryParts = []
-        phrase_start = 0
-        words = defaultdict(list)
-        wordnr = 0
         for phrase in query.source:
             query.nodes[-1].ptype = phrase.ptype
-            for word in phrase.text.split(' '):
+            phrase_split = re.split('([ :-])', phrase.text)
+            # The zip construct will give us the pairs of word/break from
+            # the regular expression split. As the split array ends on the
+            # final word, we simply use the fillvalue to even out the list and
+            # add the phrase break at the end.
+            for word, breakchar in zip_longest(*[iter(phrase_split)]*2, fillvalue=','):
+                if not word:
+                    continue
                 trans = self.transliterator.transliterate(word)
                 if trans:
                     for term in trans.split(' '):
                         if term:
-                            parts.append(QueryPart(term, word, wordnr))
-                            query.add_node(qmod.BreakType.TOKEN, phrase.ptype)
-                    query.nodes[-1].btype = qmod.BreakType.WORD
-                wordnr += 1
-            query.nodes[-1].btype = qmod.BreakType.PHRASE
+                            query.add_node(qmod.BREAK_TOKEN, phrase.ptype,
+                                           PENALTY_IN_TOKEN_BREAK[qmod.BREAK_TOKEN],
+                                           term, word)
+                    query.nodes[-1].adjust_break(breakchar,
+                                                 PENALTY_IN_TOKEN_BREAK[breakchar])
 
-            for word, wrange in yield_words(parts, phrase_start):
-                words[word].append(wrange)
-
-            phrase_start = len(parts)
-        query.nodes[-1].btype = qmod.BreakType.END
-
-        return parts, words
+        query.nodes[-1].adjust_break(qmod.BREAK_END, PENALTY_IN_TOKEN_BREAK[qmod.BREAK_END])
 
     async def lookup_in_db(self, words: List[str]) -> 'sa.Result[Any]':
         """ Return the token information from the database for the
             given word tokens.
+
+            This function excludes postcode tokens.
         """
         t = self.conn.t.meta.tables['word']
-        return await self.conn.execute(t.select().where(t.c.word_token.in_(words)))
+        return await self.conn.execute(t.select()
+                                        .where(t.c.word_token.in_(words))
+                                        .where(t.c.type != 'P'))
 
-    def add_extra_tokens(self, query: qmod.QueryStruct, parts: QueryParts) -> None:
+    def add_extra_tokens(self, query: qmod.QueryStruct) -> None:
         """ Add tokens to query that are not saved in the database.
         """
-        for part, node, i in zip(parts, query.nodes, range(1000)):
-            if len(part.token) <= 4 and part[0].isdigit()\
-               and not node.has_tokens(i+1, qmod.TokenType.HOUSENUMBER):
-                query.add_token(qmod.TokenRange(i, i+1), qmod.TokenType.HOUSENUMBER,
+        need_hnr = False
+        for i, node in enumerate(query.nodes):
+            is_full_token = node.btype not in (qmod.BREAK_TOKEN, qmod.BREAK_PART)
+            if need_hnr and is_full_token \
+                    and len(node.term_normalized) <= 4 and node.term_normalized.isdigit():
+                query.add_token(qmod.TokenRange(i-1, i), qmod.TOKEN_HOUSENUMBER,
                                 ICUToken(penalty=0.5, token=0,
-                                         count=1, addr_count=1, lookup_word=part.token,
-                                         word_token=part.token, info=None))
+                                         count=1, addr_count=1,
+                                         lookup_word=node.term_lookup,
+                                         word_token=node.term_lookup, info=None))
 
-    def rerank_tokens(self, query: qmod.QueryStruct, parts: QueryParts) -> None:
+            need_hnr = is_full_token and not node.has_tokens(i+1, qmod.TOKEN_HOUSENUMBER)
+
+    def rerank_tokens(self, query: qmod.QueryStruct) -> None:
         """ Add penalties to tokens that depend on presence of other token.
         """
-        for i, node, tlist in query.iter_token_lists():
-            if tlist.ttype == qmod.TokenType.POSTCODE:
-                for repl in node.starting:
-                    if repl.end == tlist.end and repl.ttype != qmod.TokenType.POSTCODE \
-                       and (repl.ttype != qmod.TokenType.HOUSENUMBER
-                            or len(tlist.tokens[0].lookup_word) > 4):
-                        repl.add_penalty(0.39)
-            elif (tlist.ttype == qmod.TokenType.HOUSENUMBER
-                  and len(tlist.tokens[0].lookup_word) <= 3):
-                if any(c.isdigit() for c in tlist.tokens[0].lookup_word):
-                    for repl in node.starting:
-                        if repl.end == tlist.end and repl.ttype != qmod.TokenType.HOUSENUMBER:
-                            repl.add_penalty(0.5 - tlist.tokens[0].penalty)
-            elif tlist.ttype not in (qmod.TokenType.COUNTRY, qmod.TokenType.PARTIAL):
-                norm = parts[i].normalized
-                for j in range(i + 1, tlist.end):
-                    if parts[j - 1].word_number != parts[j].word_number:
-                        norm += '  ' + parts[j].normalized
-                for token in tlist.tokens:
-                    cast(ICUToken, token).rematch(norm)
-
-
-def _dump_transliterated(query: qmod.QueryStruct, parts: QueryParts) -> str:
-    out = query.nodes[0].btype.value
-    for node, part in zip(query.nodes[1:], parts):
-        out += part.token + node.btype.value
-    return out
+        for start, end, tlist in query.iter_tokens_by_edge():
+            if len(tlist) > 1:
+                # If it looks like a Postcode, give preference.
+                if qmod.TOKEN_POSTCODE in tlist:
+                    for ttype, tokens in tlist.items():
+                        if ttype != qmod.TOKEN_POSTCODE and \
+                               (ttype != qmod.TOKEN_HOUSENUMBER or
+                                start + 1 > end or
+                                len(query.nodes[end].term_lookup) > 4):
+                            for token in tokens:
+                                token.penalty += 0.39
+
+                # If it looks like a simple housenumber, prefer that.
+                if qmod.TOKEN_HOUSENUMBER in tlist:
+                    hnr_lookup = tlist[qmod.TOKEN_HOUSENUMBER][0].lookup_word
+                    if len(hnr_lookup) <= 3 and any(c.isdigit() for c in hnr_lookup):
+                        penalty = 0.5 - tlist[qmod.TOKEN_HOUSENUMBER][0].penalty
+                        for ttype, tokens in tlist.items():
+                            if ttype != qmod.TOKEN_HOUSENUMBER:
+                                for token in tokens:
+                                    token.penalty += penalty
+
+            # rerank tokens against the normalized form
+            norm = ' '.join(n.term_normalized for n in query.nodes[start + 1:end + 1]
+                            if n.btype != qmod.BREAK_TOKEN)
+            if not norm:
+                # Can happen when the token only covers a partial term
+                norm = query.nodes[start + 1].term_normalized
+            for ttype, tokens in tlist.items():
+                if ttype != qmod.TOKEN_COUNTRY:
+                    for token in tokens:
+                        cast(ICUToken, token).rematch(norm)
 
 
 def _dump_word_tokens(query: qmod.QueryStruct) -> Iterator[List[Any]]:
-    yield ['type', 'token', 'word_token', 'lookup_word', 'penalty', 'count', 'info']
-    for node in query.nodes:
+    yield ['type', 'from', 'to', 'token', 'word_token', 'lookup_word', 'penalty', 'count', 'info']
+    for i, node in enumerate(query.nodes):
+        if node.partial is not None:
+            t = cast(ICUToken, node.partial)
+            yield [qmod.TOKEN_PARTIAL, str(i), str(i + 1), t.token,
+                   t.word_token, t.lookup_word, t.penalty, t.count, t.info]
         for tlist in node.starting:
             for token in tlist.tokens:
                 t = cast(ICUToken, token)
-                yield [tlist.ttype.name, t.token, t.word_token or '',
+                yield [tlist.ttype, str(i), str(tlist.end), t.token, t.word_token or '',
                        t.lookup_word or '', t.penalty, t.count, t.info]
 
 
@@ -305,7 +325,17 @@ async def create_query_analyzer(conn: SearchConnection) -> AbstractQueryAnalyzer
     """ Create and set up a new query analyzer for a database based
         on the ICU tokenizer.
     """
-    out = ICUQueryAnalyzer(conn)
-    await out.setup()
+    async def _get_config() -> ICUAnalyzerConfig:
+        if 'word' not in conn.t.meta.tables:
+            sa.Table('word', conn.t.meta,
+                     sa.Column('word_id', sa.Integer),
+                     sa.Column('word_token', sa.Text, nullable=False),
+                     sa.Column('type', sa.Text, nullable=False),
+                     sa.Column('word', sa.Text),
+                     sa.Column('info', Json))
+
+        return await ICUAnalyzerConfig.create(conn)
+
+    config = await conn.get_cached_value('ICUTOK', 'config', _get_config)
 
-    return out
+    return ICUQueryAnalyzer(conn, config)
diff --git a/src/nominatim_api/search/postcode_parser.py b/src/nominatim_api/search/postcode_parser.py
new file mode 100644
index 00000000..fb8b3804
--- /dev/null
+++ b/src/nominatim_api/search/postcode_parser.py
@@ -0,0 +1,104 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Handling of arbitrary postcode tokens in tokenized query string.
+"""
+from typing import Tuple, Set, Dict, List
+import re
+from collections import defaultdict
+
+import yaml
+
+from ..config import Configuration
+from . import query as qmod
+
+
+class PostcodeParser:
+    """ Pattern-based parser for postcodes in tokenized queries.
+
+        The postcode patterns are read from the country configuration.
+        The parser currently does not return country restrictions.
+    """
+
+    def __init__(self, config: Configuration) -> None:
+        # skip over includes here to avoid loading the complete country name data
+        yaml.add_constructor('!include', lambda loader, node: [],
+                             Loader=yaml.SafeLoader)
+        cdata = yaml.safe_load(config.find_config_file('country_settings.yaml')
+                                     .read_text(encoding='utf-8'))
+
+        unique_patterns: Dict[str, Dict[str, List[str]]] = {}
+        for cc, data in cdata.items():
+            if data.get('postcode'):
+                pat = data['postcode']['pattern'].replace('d', '[0-9]').replace('l', '[A-Z]')
+                out = data['postcode'].get('output')
+                if pat not in unique_patterns:
+                    unique_patterns[pat] = defaultdict(list)
+                unique_patterns[pat][out].append(cc.upper())
+
+        self.global_pattern = re.compile(
+                '(?:(?P<cc>[A-Z][A-Z])(?P<space>[ -]?))?(?P<pc>(?:(?:'
+                + ')|(?:'.join(unique_patterns) + '))[:, >].*)')
+
+        self.local_patterns = [(re.compile(f"{pat}[:, >]"), list(info.items()))
+                               for pat, info in unique_patterns.items()]
+
+    def parse(self, query: qmod.QueryStruct) -> Set[Tuple[int, int, str]]:
+        """ Parse postcodes in the given list of query tokens taking into
+            account the list of breaks from the nodes.
+
+            The result is a set of tuples with
+            [start node id, end node id, postcode token]
+        """
+        nodes = query.nodes
+        outcodes: Set[Tuple[int, int, str]] = set()
+
+        terms = [n.term_normalized.upper() + n.btype for n in nodes]
+        for i in range(query.num_token_slots()):
+            if nodes[i].btype in '<,: ' and nodes[i + 1].btype != '`' \
+                    and (i == 0 or nodes[i - 1].ptype != qmod.PHRASE_POSTCODE):
+                if nodes[i].ptype == qmod.PHRASE_ANY:
+                    word = terms[i + 1]
+                    if word[-1] in ' -' and nodes[i + 2].btype != '`' \
+                            and nodes[i + 1].ptype == qmod.PHRASE_ANY:
+                        word += terms[i + 2]
+                        if word[-1] in ' -' and nodes[i + 3].btype != '`' \
+                                and nodes[i + 2].ptype == qmod.PHRASE_ANY:
+                            word += terms[i + 3]
+
+                    self._match_word(word, i, False, outcodes)
+                elif nodes[i].ptype == qmod.PHRASE_POSTCODE:
+                    word = terms[i + 1]
+                    for j in range(i + 1, query.num_token_slots()):
+                        if nodes[j].ptype != qmod.PHRASE_POSTCODE:
+                            break
+                        word += terms[j + 1]
+
+                    self._match_word(word, i, True, outcodes)
+
+        return outcodes
+
+    def _match_word(self, word: str, pos: int, fullmatch: bool,
+                    outcodes: Set[Tuple[int, int, str]]) -> None:
+        # Use global pattern to check for presence of any postcode.
+        m = self.global_pattern.fullmatch(word)
+        if m:
+            # If there was a match, check against each pattern separately
+            # because multiple patterns might be matching at the end.
+            cc = m.group('cc')
+            pc_word = m.group('pc')
+            cc_spaces = len(m.group('space') or '')
+            for pattern, info in self.local_patterns:
+                lm = pattern.fullmatch(pc_word) if fullmatch else pattern.match(pc_word)
+                if lm:
+                    trange = (pos, pos + cc_spaces + sum(c in ' ,-:>' for c in lm.group(0)))
+                    for out, out_ccs in info:
+                        if cc is None or cc in out_ccs:
+                            if out:
+                                outcodes.add((*trange, lm.expand(out)))
+                            else:
+                                outcodes.add((*trange, lm.group(0)[:-1]))
diff --git a/src/nominatim_api/search/query.py b/src/nominatim_api/search/query.py
index 02ebbb5b..092bd586 100644
--- a/src/nominatim_api/search/query.py
+++ b/src/nominatim_api/search/query.py
@@ -2,93 +2,111 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Datastructures for a tokenized query.
 """
-from typing import List, Tuple, Optional, Iterator
+from typing import Dict, List, Tuple, Optional, Iterator
 from abc import ABC, abstractmethod
+from collections import defaultdict
 import dataclasses
-import enum
 
+# Precomputed denominator for the computation of the linear regression slope
+# used to determine the query direction.
+# The x value for the regression computation will be the position of the
+# token in the query. Thus we know the x values will be [0, query length).
+# As the denominator only depends on the x values, we can pre-compute here
+# the denominator to use for a given query length.
+# Note that query length of two or less is special cased and will not use
+# the values from this array. Thus it is not a problem that they are 0.
+LINFAC = [i * (sum(si * si for si in range(i)) - (i - 1) * i * (i - 1) / 4)
+          for i in range(50)]
 
-class BreakType(enum.Enum):
-    """ Type of break between tokens.
-    """
-    START = '<'
-    """ Begin of the query. """
-    END = '>'
-    """ End of the query. """
-    PHRASE = ','
-    """ Break between two phrases. """
-    WORD = ' '
-    """ Break between words. """
-    PART = '-'
-    """ Break inside a word, for example a hyphen or apostrophe. """
-    TOKEN = '`'
-    """ Break created as a result of tokenization.
-        This may happen in languages without spaces between words.
-    """
+
+BreakType = str
+""" Type of break between tokens.
+"""
+BREAK_START = '<'
+""" Begin of the query. """
+BREAK_END = '>'
+""" End of the query. """
+BREAK_PHRASE = ','
+""" Hard break between two phrases. Address parts cannot cross hard
+    phrase boundaries."""
+BREAK_SOFT_PHRASE = ':'
+""" Likely break between two phrases. Address parts should not cross soft
+    phrase boundaries. Soft breaks can be inserted by a preprocessor
+    that is analysing the input string.
+"""
+BREAK_WORD = ' '
+""" Break between words. """
+BREAK_PART = '-'
+""" Break inside a word, for example a hyphen or apostrophe. """
+BREAK_TOKEN = '`'
+""" Break created as a result of tokenization.
+    This may happen in languages without spaces between words.
+"""
 
 
-class TokenType(enum.Enum):
-    """ Type of token.
-    """
-    WORD = enum.auto()
-    """ Full name of a place. """
-    PARTIAL = enum.auto()
-    """ Word term without breaks, does not necessarily represent a full name. """
-    HOUSENUMBER = enum.auto()
-    """ Housenumber term. """
-    POSTCODE = enum.auto()
-    """ Postal code term. """
-    COUNTRY = enum.auto()
-    """ Country name or reference. """
-    QUALIFIER = enum.auto()
-    """ Special term used together with name (e.g. _Hotel_ Bellevue). """
-    NEAR_ITEM = enum.auto()
-    """ Special term used as searchable object(e.g. supermarket in ...). """
-
-
-class PhraseType(enum.Enum):
-    """ Designation of a phrase.
+TokenType = str
+""" Type of token.
+"""
+TOKEN_WORD = 'W'
+""" Full name of a place. """
+TOKEN_PARTIAL = 'w'
+""" Word term without breaks, does not necessarily represent a full name. """
+TOKEN_HOUSENUMBER = 'H'
+""" Housenumber term. """
+TOKEN_POSTCODE = 'P'
+""" Postal code term. """
+TOKEN_COUNTRY = 'C'
+""" Country name or reference. """
+TOKEN_QUALIFIER = 'Q'
+""" Special term used together with name (e.g. _Hotel_ Bellevue). """
+TOKEN_NEAR_ITEM = 'N'
+""" Special term used as searchable object(e.g. supermarket in ...). """
+
+
+PhraseType = int
+""" Designation of a phrase.
+"""
+PHRASE_ANY = 0
+""" No specific designation (i.e. source is free-form query). """
+PHRASE_AMENITY = 1
+""" Contains name or type of a POI. """
+PHRASE_STREET = 2
+""" Contains a street name optionally with a housenumber. """
+PHRASE_CITY = 3
+""" Contains the postal city. """
+PHRASE_COUNTY = 4
+""" Contains the equivalent of a county. """
+PHRASE_STATE = 5
+""" Contains a state or province. """
+PHRASE_POSTCODE = 6
+""" Contains a postal code. """
+PHRASE_COUNTRY = 7
+""" Contains the country name or code. """
+
+
+def _phrase_compatible_with(ptype: PhraseType, ttype: TokenType,
+                            is_full_phrase: bool) -> bool:
+    """ Check if the given token type can be used with the phrase type.
     """
-    NONE = 0
-    """ No specific designation (i.e. source is free-form query). """
-    AMENITY = enum.auto()
-    """ Contains name or type of a POI. """
-    STREET = enum.auto()
-    """ Contains a street name optionally with a housenumber. """
-    CITY = enum.auto()
-    """ Contains the postal city. """
-    COUNTY = enum.auto()
-    """ Contains the equivalent of a county. """
-    STATE = enum.auto()
-    """ Contains a state or province. """
-    POSTCODE = enum.auto()
-    """ Contains a postal code. """
-    COUNTRY = enum.auto()
-    """ Contains the country name or code. """
-
-    def compatible_with(self, ttype: TokenType,
-                        is_full_phrase: bool) -> bool:
-        """ Check if the given token type can be used with the phrase type.
-        """
-        if self == PhraseType.NONE:
-            return not is_full_phrase or ttype != TokenType.QUALIFIER
-        if self == PhraseType.AMENITY:
-            return ttype in (TokenType.WORD, TokenType.PARTIAL)\
-                   or (is_full_phrase and ttype == TokenType.NEAR_ITEM)\
-                   or (not is_full_phrase and ttype == TokenType.QUALIFIER)
-        if self == PhraseType.STREET:
-            return ttype in (TokenType.WORD, TokenType.PARTIAL, TokenType.HOUSENUMBER)
-        if self == PhraseType.POSTCODE:
-            return ttype == TokenType.POSTCODE
-        if self == PhraseType.COUNTRY:
-            return ttype == TokenType.COUNTRY
-
-        return ttype in (TokenType.WORD, TokenType.PARTIAL)
+    if ptype == PHRASE_ANY:
+        return not is_full_phrase or ttype != TOKEN_QUALIFIER
+    if ptype == PHRASE_AMENITY:
+        return ttype in (TOKEN_WORD, TOKEN_PARTIAL)\
+               or (is_full_phrase and ttype == TOKEN_NEAR_ITEM)\
+               or (not is_full_phrase and ttype == TOKEN_QUALIFIER)
+    if ptype == PHRASE_STREET:
+        return ttype in (TOKEN_WORD, TOKEN_PARTIAL, TOKEN_HOUSENUMBER)
+    if ptype == PHRASE_POSTCODE:
+        return ttype == TOKEN_POSTCODE
+    if ptype == PHRASE_COUNTRY:
+        return ttype == TOKEN_COUNTRY
+
+    return ttype in (TOKEN_WORD, TOKEN_PARTIAL)
 
 
 @dataclasses.dataclass
@@ -116,6 +134,7 @@ class TokenRange:
     """
     start: int
     end: int
+    penalty: Optional[float] = None
 
     def __lt__(self, other: 'TokenRange') -> bool:
         return self.end <= other.start
@@ -164,10 +183,49 @@ class TokenList:
 @dataclasses.dataclass
 class QueryNode:
     """ A node of the query representing a break between terms.
+
+        The node also contains information on the source term
+        ending at the node. The tokens are created from this information.
     """
     btype: BreakType
     ptype: PhraseType
+
+    penalty: float
+    """ Penalty for the break at this node.
+    """
+    term_lookup: str
+    """ Transliterated term ending at this node.
+    """
+    term_normalized: str
+    """ Normalised form of term ending at this node.
+        When the token resulted from a split during transliteration,
+        then this string contains the complete source term.
+    """
+
     starting: List[TokenList] = dataclasses.field(default_factory=list)
+    """ List of all full tokens starting at this node.
+    """
+    partial: Optional[Token] = None
+    """ Base token going to the next node.
+        May be None when the query has parts for which no words are known.
+        Note that the query may still be parsable when there are other
+        types of tokens spanning over the gap.
+    """
+
+    def name_address_ratio(self) -> float:
+        """ Return the probability that the partial token belonging to
+            this node forms part of a name (as opposed to part of the address).
+        """
+        if self.partial is None:
+            return 0.5
+
+        return self.partial.count / (self.partial.count + self.partial.addr_count)
+
+    def adjust_break(self, btype: BreakType, penalty: float) -> None:
+        """ Change the break type and penalty for this node.
+        """
+        self.btype = btype
+        self.penalty = penalty
 
     def has_tokens(self, end: int, *ttypes: TokenType) -> bool:
         """ Check if there are tokens of the given types ending at the
@@ -204,26 +262,37 @@ class QueryStruct:
         need to be direct neighbours. Thus the query is represented as a
         directed acyclic graph.
 
+        A query also has a direction penalty 'dir_penalty'. This describes
+        the likelihood that the query should be read from left-to-right or
+        vice versa. A negative 'dir_penalty' should be read as a penalty on
+        right-to-left reading, while a positive value represents a penalty
+        for left-to-right reading. The default value is 0, which is equivalent
+        to having no information about the reading.
+
         When created, a query contains a single node: the start of the
         query. Further nodes can be added by appending to 'nodes'.
     """
 
     def __init__(self, source: List[Phrase]) -> None:
         self.source = source
+        self.dir_penalty = 0.0
         self.nodes: List[QueryNode] = \
-            [QueryNode(BreakType.START, source[0].ptype if source else PhraseType.NONE)]
+            [QueryNode(BREAK_START, source[0].ptype if source else PHRASE_ANY,
+                       0.0, '', '')]
 
     def num_token_slots(self) -> int:
         """ Return the length of the query in vertice steps.
         """
         return len(self.nodes) - 1
 
-    def add_node(self, btype: BreakType, ptype: PhraseType) -> None:
+    def add_node(self, btype: BreakType, ptype: PhraseType,
+                 break_penalty: float = 0.0,
+                 term_lookup: str = '', term_normalized: str = '') -> None:
         """ Append a new break node with the given break type.
             The phrase type denotes the type for any tokens starting
             at the node.
         """
-        self.nodes.append(QueryNode(btype, ptype))
+        self.nodes.append(QueryNode(btype, ptype, break_penalty, term_lookup, term_normalized))
 
     def add_token(self, trange: TokenRange, ttype: TokenType, token: Token) -> None:
         """ Add a token to the query. 'start' and 'end' are the indexes of the
@@ -236,37 +305,63 @@ class QueryStruct:
             be added to, then the token is silently dropped.
         """
         snode = self.nodes[trange.start]
-        full_phrase = snode.btype in (BreakType.START, BreakType.PHRASE)\
-            and self.nodes[trange.end].btype in (BreakType.PHRASE, BreakType.END)
-        if snode.ptype.compatible_with(ttype, full_phrase):
-            tlist = snode.get_tokens(trange.end, ttype)
-            if tlist is None:
-                snode.starting.append(TokenList(trange.end, ttype, [token]))
-            else:
-                tlist.append(token)
+        if ttype == TOKEN_PARTIAL:
+            assert snode.partial is None
+            if _phrase_compatible_with(snode.ptype, TOKEN_PARTIAL, False):
+                snode.partial = token
+        else:
+            full_phrase = snode.btype in (BREAK_START, BREAK_PHRASE)\
+                and self.nodes[trange.end].btype in (BREAK_PHRASE, BREAK_END)
+            if _phrase_compatible_with(snode.ptype, ttype, full_phrase):
+                tlist = snode.get_tokens(trange.end, ttype)
+                if tlist is None:
+                    snode.starting.append(TokenList(trange.end, ttype, [token]))
+                else:
+                    tlist.append(token)
+
+    def compute_direction_penalty(self) -> None:
+        """ Recompute 'dir_penalty' as the slope of a linear regression over
+            the name/address ratios of the nodes (x is the node position).
+        """
+        n = len(self.nodes) - 1
+        if n <= 1 or n >= 50:  # no slope for < 2 terms; LINFAC covers < 50
+            self.dir_penalty = 0.0
+        elif n == 2:
+            self.dir_penalty = (self.nodes[1].name_address_ratio()
+                                - self.nodes[0].name_address_ratio()) / 3
+        else:
+            ratios = [node.name_address_ratio() for node in self.nodes[:-1]]
+            self.dir_penalty = (n * sum(i * r for i, r in enumerate(ratios))
+                                - sum(ratios) * n * (n - 1) / 2) / LINFAC[n]
 
     def get_tokens(self, trange: TokenRange, ttype: TokenType) -> List[Token]:
         """ Get the list of tokens of a given type, spanning the given
             nodes. The nodes must exist. If no tokens exist, an
             empty list is returned.
+
+            Cannot be used to get the partial token.
         """
+        assert ttype != TOKEN_PARTIAL
         return self.nodes[trange.start].get_tokens(trange.end, ttype) or []
 
-    def get_partials_list(self, trange: TokenRange) -> List[Token]:
-        """ Create a list of partial tokens between the given nodes.
-            The list is composed of the first token of type PARTIAL
-            going to the subsequent node. Such PARTIAL tokens are
-            assumed to exist.
+    def iter_partials(self, trange: TokenRange) -> Iterator[Token]:
+        """ Iterate over the partial tokens between the given nodes.
+            Missing partials are ignored.
         """
-        return [next(iter(self.get_tokens(TokenRange(i, i+1), TokenType.PARTIAL)))
-                for i in range(trange.start, trange.end)]
+        return (n.partial for n in self.nodes[trange.start:trange.end] if n.partial is not None)
+
+    def iter_tokens_by_edge(self) -> Iterator[Tuple[int, int, Dict[TokenType, List[Token]]]]:
+        """ Iterator over all tokens except partial ones grouped by edge.
 
-    def iter_token_lists(self) -> Iterator[Tuple[int, QueryNode, TokenList]]:
-        """ Iterator over all token lists in the query.
+            Returns the start and end node indexes and a dictionary
+            of list of tokens by token type.
         """
         for i, node in enumerate(self.nodes):
+            by_end: Dict[int, Dict[TokenType, List[Token]]] = defaultdict(dict)
             for tlist in node.starting:
-                yield i, node, tlist
+                by_end[tlist.end][tlist.ttype] = tlist.tokens
+            for end, endlist in by_end.items():
+                yield i, end, endlist
 
     def find_lookup_word_by_id(self, token: int) -> str:
         """ Find the first token with the given token ID and return
@@ -275,8 +370,51 @@ class QueryStruct:
             debugging.
         """
         for node in self.nodes:
+            if node.partial is not None and node.partial.token == token:
+                return f"[P]{node.partial.lookup_word}"
             for tlist in node.starting:
                 for t in tlist.tokens:
                     if t.token == token:
-                        return f"[{tlist.ttype.name[0]}]{t.lookup_word}"
+                        return f"[{tlist.ttype}]{t.lookup_word}"
         return 'None'
+
+    def get_transliterated_query(self) -> str:
+        """ Return a string representation of the transliterated query
+            with the character representation of the different break types.
+
+            For debugging purposes only.
+        """
+        return ''.join(''.join((n.term_lookup, n.btype)) for n in self.nodes)
+
+    def extract_words(self, base_penalty: float = 0.0,
+                      start: int = 0,
+                      endpos: Optional[int] = None) -> Dict[str, List[TokenRange]]:
+        """ Collect all combinations of words that can be formed from the terms
+            between the given start and endnode. The terms are joined with
+            spaces for each break. Words can never go across a BREAK_PHRASE.
+
+            The function returns a dictionary of possible words with their
+            position within the query and a penalty. The penalty is computed
+            from the base_penalty plus the penalty for each node the word
+            crosses.
+        """
+        if endpos is None:
+            endpos = len(self.nodes)
+
+        words: Dict[str, List[TokenRange]] = defaultdict(list)
+
+        for first, first_node in enumerate(self.nodes[start + 1:endpos], start):
+            word = first_node.term_lookup
+            penalty = base_penalty
+            words[word].append(TokenRange(first, first + 1, penalty=penalty))
+            if first_node.btype != BREAK_PHRASE:
+                penalty += first_node.penalty
+                max_last = min(first + 20, endpos)
+                for last, last_node in enumerate(self.nodes[first + 2:max_last], first + 2):
+                    word = ' '.join((word, last_node.term_lookup))
+                    words[word].append(TokenRange(first, last, penalty=penalty))
+                    if last_node.btype == BREAK_PHRASE:
+                        break
+                    penalty += last_node.penalty
+
+        return words
diff --git a/src/nominatim_api/search/token_assignment.py b/src/nominatim_api/search/token_assignment.py
index a2e1804c..4247158c 100644
--- a/src/nominatim_api/search/token_assignment.py
+++ b/src/nominatim_api/search/token_assignment.py
@@ -24,12 +24,13 @@ class TypedRange:
 
 
 PENALTY_TOKENCHANGE = {
-    qmod.BreakType.START: 0.0,
-    qmod.BreakType.END: 0.0,
-    qmod.BreakType.PHRASE: 0.0,
-    qmod.BreakType.WORD: 0.1,
-    qmod.BreakType.PART: 0.2,
-    qmod.BreakType.TOKEN: 0.4
+    qmod.BREAK_START: 0.0,
+    qmod.BREAK_END: 0.0,
+    qmod.BREAK_PHRASE: 0.0,
+    qmod.BREAK_SOFT_PHRASE: 0.0,
+    qmod.BREAK_WORD: 0.1,
+    qmod.BREAK_PART: 0.2,
+    qmod.BREAK_TOKEN: 0.4
 }
 
 TypedRangeSeq = List[TypedRange]
@@ -55,17 +56,17 @@ class TokenAssignment:
         """
         out = TokenAssignment()
         for token in ranges:
-            if token.ttype == qmod.TokenType.PARTIAL:
+            if token.ttype == qmod.TOKEN_PARTIAL:
                 out.address.append(token.trange)
-            elif token.ttype == qmod.TokenType.HOUSENUMBER:
+            elif token.ttype == qmod.TOKEN_HOUSENUMBER:
                 out.housenumber = token.trange
-            elif token.ttype == qmod.TokenType.POSTCODE:
+            elif token.ttype == qmod.TOKEN_POSTCODE:
                 out.postcode = token.trange
-            elif token.ttype == qmod.TokenType.COUNTRY:
+            elif token.ttype == qmod.TOKEN_COUNTRY:
                 out.country = token.trange
-            elif token.ttype == qmod.TokenType.NEAR_ITEM:
+            elif token.ttype == qmod.TOKEN_NEAR_ITEM:
                 out.near_item = token.trange
-            elif token.ttype == qmod.TokenType.QUALIFIER:
+            elif token.ttype == qmod.TOKEN_QUALIFIER:
                 out.qualifier = token.trange
         return out
 
@@ -83,7 +84,7 @@ class _TokenSequence:
         self.penalty = penalty
 
     def __str__(self) -> str:
-        seq = ''.join(f'[{r.trange.start} - {r.trange.end}: {r.ttype.name}]' for r in self.seq)
+        seq = ''.join(f'[{r.trange.start} - {r.trange.end}: {r.ttype}]' for r in self.seq)
         return f'{seq} (dir: {self.direction}, penalty: {self.penalty})'
 
     @property
@@ -104,7 +105,7 @@ class _TokenSequence:
         """
         # Country and category must be the final term for left-to-right
         return len(self.seq) > 1 and \
-            self.seq[-1].ttype in (qmod.TokenType.COUNTRY, qmod.TokenType.NEAR_ITEM)
+            self.seq[-1].ttype in (qmod.TOKEN_COUNTRY, qmod.TOKEN_NEAR_ITEM)
 
     def appendable(self, ttype: qmod.TokenType) -> Optional[int]:
         """ Check if the give token type is appendable to the existing sequence.
@@ -113,23 +114,23 @@ class _TokenSequence:
             new direction of the sequence after adding such a type. The
             token is not added.
         """
-        if ttype == qmod.TokenType.WORD:
+        if ttype == qmod.TOKEN_WORD:
             return None
 
         if not self.seq:
             # Append unconditionally to the empty list
-            if ttype == qmod.TokenType.COUNTRY:
+            if ttype == qmod.TOKEN_COUNTRY:
                 return -1
-            if ttype in (qmod.TokenType.HOUSENUMBER, qmod.TokenType.QUALIFIER):
+            if ttype in (qmod.TOKEN_HOUSENUMBER, qmod.TOKEN_QUALIFIER):
                 return 1
             return self.direction
 
         # Name tokens are always acceptable and don't change direction
-        if ttype == qmod.TokenType.PARTIAL:
+        if ttype == qmod.TOKEN_PARTIAL:
             # qualifiers cannot appear in the middle of the query. They need
             # to be near the next phrase.
             if self.direction == -1 \
-               and any(t.ttype == qmod.TokenType.QUALIFIER for t in self.seq[:-1]):
+               and any(t.ttype == qmod.TOKEN_QUALIFIER for t in self.seq[:-1]):
                 return None
             return self.direction
 
@@ -137,54 +138,54 @@ class _TokenSequence:
         if self.has_types(ttype):
             return None
 
-        if ttype == qmod.TokenType.HOUSENUMBER:
+        if ttype == qmod.TOKEN_HOUSENUMBER:
             if self.direction == 1:
-                if len(self.seq) == 1 and self.seq[0].ttype == qmod.TokenType.QUALIFIER:
+                if len(self.seq) == 1 and self.seq[0].ttype == qmod.TOKEN_QUALIFIER:
                     return None
                 if len(self.seq) > 2 \
-                   or self.has_types(qmod.TokenType.POSTCODE, qmod.TokenType.COUNTRY):
+                   or self.has_types(qmod.TOKEN_POSTCODE, qmod.TOKEN_COUNTRY):
                     return None  # direction left-to-right: housenumber must come before anything
             elif (self.direction == -1
-                  or self.has_types(qmod.TokenType.POSTCODE, qmod.TokenType.COUNTRY)):
+                  or self.has_types(qmod.TOKEN_POSTCODE, qmod.TOKEN_COUNTRY)):
                 return -1  # force direction right-to-left if after other terms
 
             return self.direction
 
-        if ttype == qmod.TokenType.POSTCODE:
+        if ttype == qmod.TOKEN_POSTCODE:
             if self.direction == -1:
-                if self.has_types(qmod.TokenType.HOUSENUMBER, qmod.TokenType.QUALIFIER):
+                if self.has_types(qmod.TOKEN_HOUSENUMBER, qmod.TOKEN_QUALIFIER):
                     return None
                 return -1
             if self.direction == 1:
-                return None if self.has_types(qmod.TokenType.COUNTRY) else 1
-            if self.has_types(qmod.TokenType.HOUSENUMBER, qmod.TokenType.QUALIFIER):
+                return None if self.has_types(qmod.TOKEN_COUNTRY) else 1
+            if self.has_types(qmod.TOKEN_HOUSENUMBER, qmod.TOKEN_QUALIFIER):
                 return 1
             return self.direction
 
-        if ttype == qmod.TokenType.COUNTRY:
+        if ttype == qmod.TOKEN_COUNTRY:
             return None if self.direction == -1 else 1
 
-        if ttype == qmod.TokenType.NEAR_ITEM:
+        if ttype == qmod.TOKEN_NEAR_ITEM:
             return self.direction
 
-        if ttype == qmod.TokenType.QUALIFIER:
+        if ttype == qmod.TOKEN_QUALIFIER:
             if self.direction == 1:
                 if (len(self.seq) == 1
-                    and self.seq[0].ttype in (qmod.TokenType.PARTIAL, qmod.TokenType.NEAR_ITEM)) \
+                    and self.seq[0].ttype in (qmod.TOKEN_PARTIAL, qmod.TOKEN_NEAR_ITEM)) \
                    or (len(self.seq) == 2
-                       and self.seq[0].ttype == qmod.TokenType.NEAR_ITEM
-                       and self.seq[1].ttype == qmod.TokenType.PARTIAL):
+                       and self.seq[0].ttype == qmod.TOKEN_NEAR_ITEM
+                       and self.seq[1].ttype == qmod.TOKEN_PARTIAL):
                     return 1
                 return None
             if self.direction == -1:
                 return -1
 
-            tempseq = self.seq[1:] if self.seq[0].ttype == qmod.TokenType.NEAR_ITEM else self.seq
+            tempseq = self.seq[1:] if self.seq[0].ttype == qmod.TOKEN_NEAR_ITEM else self.seq
             if len(tempseq) == 0:
                 return 1
-            if len(tempseq) == 1 and self.seq[0].ttype == qmod.TokenType.HOUSENUMBER:
+            if len(tempseq) == 1 and self.seq[0].ttype == qmod.TOKEN_HOUSENUMBER:
                 return None
-            if len(tempseq) > 1 or self.has_types(qmod.TokenType.POSTCODE, qmod.TokenType.COUNTRY):
+            if len(tempseq) > 1 or self.has_types(qmod.TOKEN_POSTCODE, qmod.TOKEN_COUNTRY):
                 return -1
             return 0
 
@@ -204,7 +205,7 @@ class _TokenSequence:
             new_penalty = 0.0
         else:
             last = self.seq[-1]
-            if btype != qmod.BreakType.PHRASE and last.ttype == ttype:
+            if btype != qmod.BREAK_PHRASE and last.ttype == ttype:
                 # extend the existing range
                 newseq = self.seq[:-1] + [TypedRange(ttype, last.trange.replace_end(end_pos))]
                 new_penalty = 0.0
@@ -239,18 +240,18 @@ class _TokenSequence:
         # housenumbers may not be further than 2 words from the beginning.
         # If there are two words in front, give it a penalty.
         hnrpos = next((i for i, tr in enumerate(self.seq)
-                       if tr.ttype == qmod.TokenType.HOUSENUMBER),
+                       if tr.ttype == qmod.TOKEN_HOUSENUMBER),
                       None)
         if hnrpos is not None:
             if self.direction != -1:
-                priors = sum(1 for t in self.seq[:hnrpos] if t.ttype == qmod.TokenType.PARTIAL)
+                priors = sum(1 for t in self.seq[:hnrpos] if t.ttype == qmod.TOKEN_PARTIAL)
                 if not self._adapt_penalty_from_priors(priors, -1):
                     return False
             if self.direction != 1:
-                priors = sum(1 for t in self.seq[hnrpos+1:] if t.ttype == qmod.TokenType.PARTIAL)
+                priors = sum(1 for t in self.seq[hnrpos+1:] if t.ttype == qmod.TOKEN_PARTIAL)
                 if not self._adapt_penalty_from_priors(priors, 1):
                     return False
-            if any(t.ttype == qmod.TokenType.NEAR_ITEM for t in self.seq):
+            if any(t.ttype == qmod.TOKEN_NEAR_ITEM for t in self.seq):
                 self.penalty += 1.0
 
         return True
@@ -268,10 +269,9 @@ class _TokenSequence:
             # <address>,<postcode> should give preference to address search
             if base.postcode.start == 0:
                 penalty = self.penalty
-                self.direction = -1  # name searches are only possible backwards
             else:
                 penalty = self.penalty + 0.1
-                self.direction = 1  # name searches are only possible forwards
+            penalty += 0.1 * max(0, len(base.address) - 1)
             yield dataclasses.replace(base, penalty=penalty)
 
     def _get_assignments_address_forward(self, base: TokenAssignment,
@@ -281,8 +281,17 @@ class _TokenSequence:
         """
         first = base.address[0]
 
+        # The postcode must come after the name.
+        if base.postcode and base.postcode < first:
+            log().var_dump('skip forward', (base.postcode, first))
+            return
+
+        penalty = self.penalty
+        if not base.country and self.direction == 1 and query.dir_penalty > 0:
+            penalty += query.dir_penalty
+
         log().comment('first word = name')
-        yield dataclasses.replace(base, penalty=self.penalty,
+        yield dataclasses.replace(base, penalty=penalty,
                                   name=first, address=base.address[1:])
 
         # To paraphrase:
@@ -292,17 +301,18 @@ class _TokenSequence:
         #  * the containing phrase is strictly typed
         if (base.housenumber and first.end < base.housenumber.start)\
            or (base.qualifier and base.qualifier > first)\
-           or (query.nodes[first.start].ptype != qmod.PhraseType.NONE):
+           or (query.nodes[first.start].ptype != qmod.PHRASE_ANY):
             return
 
-        penalty = self.penalty
-
         # Penalty for:
         #  * <name>, <street>, <housenumber> , ...
         #  * queries that are comma-separated
         if (base.housenumber and base.housenumber > first) or len(query.source) > 1:
             penalty += 0.25
 
+        if self.direction == 0 and query.dir_penalty > 0:
+            penalty += query.dir_penalty
+
         for i in range(first.start + 1, first.end):
             name, addr = first.split(i)
             log().comment(f'split first word = name ({i - first.start})')
@@ -316,9 +326,18 @@ class _TokenSequence:
         """
         last = base.address[-1]
 
-        if self.direction == -1 or len(base.address) > 1:
+        # The postcode must come before the name for backward direction.
+        if base.postcode and base.postcode > last:
+            log().var_dump('skip backward', (base.postcode, last))
+            return
+
+        penalty = self.penalty
+        if not base.country and self.direction == -1 and query.dir_penalty < 0:
+            penalty -= query.dir_penalty
+
+        if self.direction == -1 or len(base.address) > 1 or base.postcode:
             log().comment('last word = name')
-            yield dataclasses.replace(base, penalty=self.penalty,
+            yield dataclasses.replace(base, penalty=penalty,
                                       name=last, address=base.address[:-1])
 
         # To paraphrase:
@@ -328,15 +347,17 @@ class _TokenSequence:
         #  * the containing phrase is strictly typed
         if (base.housenumber and last.start > base.housenumber.end)\
            or (base.qualifier and base.qualifier < last)\
-           or (query.nodes[last.start].ptype != qmod.PhraseType.NONE):
+           or (query.nodes[last.start].ptype != qmod.PHRASE_ANY):
             return
 
-        penalty = self.penalty
         if base.housenumber and base.housenumber < last:
             penalty += 0.4
         if len(query.source) > 1:
             penalty += 0.25
 
+        if self.direction == 0 and query.dir_penalty < 0:
+            penalty -= query.dir_penalty
+
         for i in range(last.start + 1, last.end):
             addr, name = last.split(i)
             log().comment(f'split last word = name ({i - last.start})')
@@ -369,11 +390,11 @@ class _TokenSequence:
             if base.postcode and base.postcode.start == 0:
                 self.penalty += 0.1
 
-            # Right-to-left reading of the address
+            # Left-to-right reading of the address
             if self.direction != -1:
                 yield from self._get_assignments_address_forward(base, query)
 
-            # Left-to-right reading of the address
+            # Right-to-left reading of the address
             if self.direction != 1:
                 yield from self._get_assignments_address_backward(base, query)
 
@@ -392,18 +413,29 @@ def yield_token_assignments(query: qmod.QueryStruct) -> Iterator[TokenAssignment
         another. It does not include penalties for transitions within a
         type.
     """
-    todo = [_TokenSequence([], direction=0 if query.source[0].ptype == qmod.PhraseType.NONE else 1)]
+    todo = [_TokenSequence([], direction=0 if query.source[0].ptype == qmod.PHRASE_ANY else 1)]
 
     while todo:
         state = todo.pop()
         node = query.nodes[state.end_pos]
 
         for tlist in node.starting:
-            newstate = state.advance(tlist.ttype, tlist.end, node.btype)
-            if newstate is not None:
-                if newstate.end_pos == query.num_token_slots():
-                    if newstate.recheck_sequence():
-                        log().var_dump('Assignment', newstate)
-                        yield from newstate.get_assignments(query)
-                elif not newstate.is_final():
-                    todo.append(newstate)
+            yield from _append_state_to_todo(
+                query, todo,
+                state.advance(tlist.ttype, tlist.end, node.btype))
+
+        if node.partial is not None:
+            yield from _append_state_to_todo(
+                query, todo,
+                state.advance(qmod.TOKEN_PARTIAL, state.end_pos + 1, node.btype))
+
+
+def _append_state_to_todo(query: qmod.QueryStruct, todo: List[_TokenSequence],
+                          newstate: Optional[_TokenSequence]) -> Iterator[TokenAssignment]:
+    if newstate is not None:
+        if newstate.end_pos == query.num_token_slots():
+            if newstate.recheck_sequence():
+                log().var_dump('Assignment', newstate)
+                yield from newstate.get_assignments(query)
+        elif not newstate.is_final():
+            todo.append(newstate)
diff --git a/src/nominatim_api/sql/sqlalchemy_functions.py b/src/nominatim_api/sql/sqlalchemy_functions.py
index 81fc83d6..00830f33 100644
--- a/src/nominatim_api/sql/sqlalchemy_functions.py
+++ b/src/nominatim_api/sql/sqlalchemy_functions.py
@@ -122,15 +122,18 @@ class IsAddressPoint(sa.sql.functions.GenericFunction[Any]):
 
     def __init__(self, table: sa.Table) -> None:
         super().__init__(table.c.rank_address,
-                         table.c.housenumber, table.c.name)
+                         table.c.housenumber, table.c.name, table.c.address)
 
 
 @compiles(IsAddressPoint)
 def default_is_address_point(element: IsAddressPoint,
                              compiler: 'sa.Compiled', **kw: Any) -> str:
-    rank, hnr, name = list(element.clauses)
-    return "(%s = 30 AND (%s IS NOT NULL OR %s ? 'addr:housename'))" % (
+    rank, hnr, name, address = list(element.clauses)
+    return "(%s = 30 AND (%s IS NULL OR NOT %s ? '_inherited')" \
+           " AND (%s IS NOT NULL OR %s ? 'addr:housename'))" % (
                 compiler.process(rank, **kw),
+                compiler.process(address, **kw),
+                compiler.process(address, **kw),
                 compiler.process(hnr, **kw),
                 compiler.process(name, **kw))
 
@@ -138,9 +141,11 @@ def default_is_address_point(element: IsAddressPoint,
 @compiles(IsAddressPoint, 'sqlite')
 def sqlite_is_address_point(element: IsAddressPoint,
                             compiler: 'sa.Compiled', **kw: Any) -> str:
-    rank, hnr, name = list(element.clauses)
-    return "(%s = 30 AND coalesce(%s, json_extract(%s, '$.addr:housename')) IS NOT NULL)" % (
+    rank, hnr, name, address = list(element.clauses)
+    return "(%s = 30 AND json_extract(%s, '$._inherited') IS NULL" \
+           " AND coalesce(%s, json_extract(%s, '$.addr:housename')) IS NOT NULL)" % (
                 compiler.process(rank, **kw),
+                compiler.process(address, **kw),
                 compiler.process(hnr, **kw),
                 compiler.process(name, **kw))
 
diff --git a/src/nominatim_api/sql/sqlalchemy_types/geometry.py b/src/nominatim_api/sql/sqlalchemy_types/geometry.py
index 90adcce8..583568c4 100644
--- a/src/nominatim_api/sql/sqlalchemy_types/geometry.py
+++ b/src/nominatim_api/sql/sqlalchemy_types/geometry.py
@@ -173,7 +173,7 @@ class Geometry(types.UserDefinedType):  # type: ignore[type-arg]
     def __init__(self, subtype: str = 'Geometry'):
         self.subtype = subtype
 
-    def get_col_spec(self) -> str:
+    def get_col_spec(self, **_: Any) -> str:
         return f'GEOMETRY({self.subtype}, 4326)'
 
     def bind_processor(self, dialect: 'sa.Dialect') -> Callable[[Any], str]:
diff --git a/src/nominatim_api/sql/sqlalchemy_types/json.py b/src/nominatim_api/sql/sqlalchemy_types/json.py
index 1c8f9f7b..f3ea9c6e 100644
--- a/src/nominatim_api/sql/sqlalchemy_types/json.py
+++ b/src/nominatim_api/sql/sqlalchemy_types/json.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Common json type for different dialects.
@@ -24,6 +24,6 @@ class Json(sa.types.TypeDecorator[Any]):
 
     def load_dialect_impl(self, dialect: SaDialect) -> sa.types.TypeEngine[Any]:
         if dialect.name == 'postgresql':
-            return JSONB(none_as_null=True)  # type: ignore[no-untyped-call]
+            return JSONB(none_as_null=True)
 
         return sqlite_json(none_as_null=True)
diff --git a/src/nominatim_api/types.py b/src/nominatim_api/types.py
index 66a3c553..e58df478 100644
--- a/src/nominatim_api/types.py
+++ b/src/nominatim_api/types.py
@@ -144,7 +144,7 @@ class Point(NamedTuple):
         except ValueError as exc:
             raise UsageError('Point parameter needs to be numbers.') from exc
 
-        if x < -180.0 or x > 180.0 or y < -90.0 or y > 90.0:
+        if not -180 <= x <= 180 or not -90 <= y <= 90.0:
             raise UsageError('Point coordinates invalid.')
 
         return Point(x, y)
diff --git a/src/nominatim_api/typing.py b/src/nominatim_api/typing.py
index 89aa4428..be9e9b58 100644
--- a/src/nominatim_api/typing.py
+++ b/src/nominatim_api/typing.py
@@ -21,9 +21,11 @@ if TYPE_CHECKING:
     from typing import Any
     import sqlalchemy as sa
     import os
-    from typing_extensions import (TypeAlias as TypeAlias)
+    from typing_extensions import (TypeAlias as TypeAlias,
+                                   Protocol as Protocol)
 else:
     TypeAlias = str
+    Protocol = object
 
 StrPath = Union[str, 'os.PathLike[str]']
 
diff --git a/src/nominatim_api/v1/classtypes.py b/src/nominatim_api/v1/classtypes.py
index 7198b412..c2fe1453 100644
--- a/src/nominatim_api/v1/classtypes.py
+++ b/src/nominatim_api/v1/classtypes.py
@@ -25,8 +25,8 @@ def get_label_tag(category: Tuple[str, str], extratags: Optional[Mapping[str, st
     elif rank < 26 and extratags and 'linked_place' in extratags:
         label = extratags['linked_place']
     elif category == ('boundary', 'administrative'):
-        label = ADMIN_LABELS.get((country or '', int(rank/2)))\
-                or ADMIN_LABELS.get(('', int(rank/2)))\
+        label = ADMIN_LABELS.get((country or '', rank // 2))\
+                or ADMIN_LABELS.get(('', rank // 2))\
                 or 'Administrative'
     elif category[1] == 'postal_code':
         label = 'postcode'
diff --git a/src/nominatim_api/v1/format_json.py b/src/nominatim_api/v1/format_json.py
index b397e702..9d7c3bd4 100644
--- a/src/nominatim_api/v1/format_json.py
+++ b/src/nominatim_api/v1/format_json.py
@@ -84,8 +84,9 @@ def format_base_json(results: Union[ReverseResults, SearchResults],
 
         _write_osm_id(out, result.osm_object)
 
-        out.keyval('lat', f"{result.centroid.lat}")\
-           .keyval('lon', f"{result.centroid.lon}")\
+        # lat and lon must be string values
+        out.keyval('lat', f"{result.centroid.lat:0.7f}")\
+           .keyval('lon', f"{result.centroid.lon:0.7f}")\
            .keyval(class_label, result.category[0])\
            .keyval('type', result.category[1])\
            .keyval('place_rank', result.rank_search)\
@@ -112,6 +113,7 @@ def format_base_json(results: Union[ReverseResults, SearchResults],
         if options.get('namedetails', False):
             out.keyval('namedetails', result.names)
 
+        # boundingbox coordinates must be string values
         bbox = cl.bbox_from_result(result)
         out.key('boundingbox').start_array()\
            .value(f"{bbox.minlat:0.7f}").next()\
@@ -249,6 +251,9 @@ def format_base_geocodejson(results: Union[ReverseResults, SearchResults],
                         out.keyval(f"level{line.admin_level}", line.local_name)
             out.end_object().next()
 
+        if options.get('extratags', False):
+            out.keyval('extra', result.extratags)
+
         out.end_object().next().end_object().next()
 
         out.key('geometry').raw(result.geometry.get('geojson')
diff --git a/src/nominatim_api/v1/format_xml.py b/src/nominatim_api/v1/format_xml.py
index b3f0e562..ed6aca0a 100644
--- a/src/nominatim_api/v1/format_xml.py
+++ b/src/nominatim_api/v1/format_xml.py
@@ -90,7 +90,7 @@ def format_base_xml(results: Union[ReverseResults, SearchResults],
         result will be output, otherwise a list.
     """
     root = ET.Element(xml_root_tag)
-    root.set('timestamp', dt.datetime.utcnow().strftime('%a, %d %b %Y %H:%M:%S +00:00'))
+    root.set('timestamp', dt.datetime.now(dt.timezone.utc).strftime('%a, %d %b %Y %H:%M:%S +00:00'))
     root.set('attribution', cl.OSM_ATTRIBUTION)
     for k, v in xml_extra_info.items():
         root.set(k, v)
diff --git a/src/nominatim_api/version.py b/src/nominatim_api/version.py
index 8c4de5a4..3c98435d 100644
--- a/src/nominatim_api/version.py
+++ b/src/nominatim_api/version.py
@@ -8,4 +8,4 @@
 Version information for the Nominatim API.
 """
 
-NOMINATIM_API_VERSION = '4.5.0'
+NOMINATIM_API_VERSION = '5.1.0'
diff --git a/src/nominatim_db/cli.py b/src/nominatim_db/cli.py
index f5f74208..8d4585c6 100644
--- a/src/nominatim_db/cli.py
+++ b/src/nominatim_db/cli.py
@@ -2,16 +2,15 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Command-line interface to the Nominatim functions for import, update,
 database administration and querying.
 """
-from typing import Optional, Any
+from typing import Optional, List, Mapping
 import importlib
 import logging
-import os
 import sys
 import argparse
 import asyncio
@@ -81,13 +80,14 @@ class CommandlineParser:
         parser.set_defaults(command=cmd)
         cmd.add_args(parser)
 
-    def run(self, **kwargs: Any) -> int:
+    def run(self, cli_args: Optional[List[str]],
+            environ: Optional[Mapping[str, str]]) -> int:
         """ Parse the command line arguments of the program and execute the
             appropriate subcommand.
         """
         args = NominatimArgs()
         try:
-            self.parser.parse_args(args=kwargs.get('cli_args'), namespace=args)
+            self.parser.parse_args(args=cli_args, namespace=args)
         except SystemExit:
             return 1
 
@@ -101,23 +101,19 @@ class CommandlineParser:
 
         args.project_dir = Path(args.project_dir).resolve()
 
-        if 'cli_args' not in kwargs:
+        if cli_args is None:
             logging.basicConfig(stream=sys.stderr,
                                 format='%(asctime)s: %(message)s',
                                 datefmt='%Y-%m-%d %H:%M:%S',
                                 level=max(4 - args.verbose, 1) * 10)
 
-        args.config = Configuration(args.project_dir,
-                                    environ=kwargs.get('environ', os.environ))
-        args.config.set_libdirs(osm2pgsql=kwargs['osm2pgsql_path'])
+        args.config = Configuration(args.project_dir, environ=environ)
 
         log = logging.getLogger()
         log.warning('Using project directory: %s', str(args.project_dir))
 
         try:
-            ret = args.command.run(args)
-
-            return ret
+            return args.command.run(args)
         except UsageError as exception:
             if log.isEnabledFor(logging.DEBUG):
                 raise  # use Python's exception printing
@@ -233,9 +229,16 @@ def get_set_parser() -> CommandlineParser:
     return parser
 
 
-def nominatim(**kwargs: Any) -> int:
+def nominatim(cli_args: Optional[List[str]] = None,
+              environ: Optional[Mapping[str, str]] = None) -> int:
     """\
     Command-line tools for importing, updating, administrating and
     querying the Nominatim database.
+
+    'cli_args' is a list of parameters for the command to run. If not given,
+    sys.argv will be used.
+
+    'environ' is the dictionary of environment variables containing the
+    Nominatim configuration. When None, os.environ is inherited.
     """
-    return get_set_parser().run(**kwargs)
+    return get_set_parser().run(cli_args=cli_args, environ=environ)
diff --git a/src/nominatim_db/clicmd/args.py b/src/nominatim_db/clicmd/args.py
index 488ecd18..45df9b7c 100644
--- a/src/nominatim_db/clicmd/args.py
+++ b/src/nominatim_db/clicmd/args.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Provides custom functions over command-line arguments.
@@ -186,10 +186,10 @@ class NominatimArgs:
             from the command line arguments. The resulting dict can be
             further customized and then used in `run_osm2pgsql()`.
         """
-        return dict(osm2pgsql=self.config.OSM2PGSQL_BINARY or self.config.lib_dir.osm2pgsql,
+        return dict(osm2pgsql=self.config.OSM2PGSQL_BINARY,
                     osm2pgsql_cache=self.osm2pgsql_cache or default_cache,
                     osm2pgsql_style=self.config.get_import_style_file(),
-                    osm2pgsql_style_path=self.config.config_dir,
+                    osm2pgsql_style_path=self.config.lib_dir.lua,
                     threads=self.threads or default_threads,
                     dsn=self.config.get_libpq_dsn(),
                     flatnode_file=str(self.config.get_path('FLATNODE_FILE') or ''),
diff --git a/src/nominatim_db/clicmd/setup.py b/src/nominatim_db/clicmd/setup.py
index 39cbe65a..fb193838 100644
--- a/src/nominatim_db/clicmd/setup.py
+++ b/src/nominatim_db/clicmd/setup.py
@@ -122,13 +122,16 @@ class SetupAll:
 
         LOG.warning('Post-process tables')
         with connect(args.config.get_libpq_dsn()) as conn:
+            conn.autocommit = True
             await database_import.create_search_indices(conn, args.config,
                                                         drop=args.no_updates,
                                                         threads=num_threads)
             LOG.warning('Create search index for default country names.')
+            conn.autocommit = False
             country_info.create_country_names(conn, tokenizer,
                                               args.config.get_str_list('LANGUAGES'))
             if args.no_updates:
+                conn.autocommit = True
                 freeze.drop_update_tables(conn)
         tokenizer.finalize_import(args.config)
 
@@ -183,6 +186,7 @@ class SetupAll:
         from ..tools import database_import, refresh
 
         with connect(config.get_libpq_dsn()) as conn:
+            conn.autocommit = True
             LOG.warning('Create functions (1st pass)')
             refresh.create_functions(conn, config, False, False)
             LOG.warning('Create tables')
diff --git a/src/nominatim_db/config.py b/src/nominatim_db/config.py
index ad54ab3d..ba804122 100644
--- a/src/nominatim_db/config.py
+++ b/src/nominatim_db/config.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Nominatim configuration accessor.
@@ -73,8 +73,8 @@ class Configuration:
             self.project_dir = None
 
         class _LibDirs:
-            osm2pgsql: Path
             sql = paths.SQLLIB_DIR
+            lua = paths.LUALIB_DIR
             data = paths.DATA_DIR
 
         self.lib_dir = _LibDirs()
@@ -207,7 +207,7 @@ class Configuration:
         style = getattr(self, 'IMPORT_STYLE')
 
         if style in ('admin', 'street', 'address', 'full', 'extratags'):
-            return self.config_dir / f'import-{style}.lua'
+            return self.lib_dir.lua / f'import-{style}.lua'
 
         return self.find_config_file('', 'IMPORT_STYLE')
 
diff --git a/src/nominatim_db/db/connection.py b/src/nominatim_db/db/connection.py
index e960a3fa..cc843ab6 100644
--- a/src/nominatim_db/db/connection.py
+++ b/src/nominatim_db/db/connection.py
@@ -102,10 +102,10 @@ def server_version_tuple(conn: Connection) -> Tuple[int, int]:
         Converts correctly for pre-10 and post-10 PostgreSQL versions.
     """
     version = conn.info.server_version
-    if version < 100000:
-        return (int(version / 10000), int((version % 10000) / 100))
-
-    return (int(version / 10000), version % 10000)
+    major, minor = divmod(version, 10000)
+    if major < 10:
+        minor //= 100
+    return major, minor
 
 
 def postgis_version_tuple(conn: Connection) -> Tuple[int, int]:
diff --git a/src/nominatim_db/indexer/progress.py b/src/nominatim_db/indexer/progress.py
index 66c35f06..b99296e5 100644
--- a/src/nominatim_db/indexer/progress.py
+++ b/src/nominatim_db/indexer/progress.py
@@ -50,8 +50,8 @@ class ProgressLogger:
         places_per_sec = self.done_places / done_time
         eta = (self.total_places - self.done_places) / places_per_sec
 
-        LOG.warning("Done %d in %d @ %.3f per second - %s ETA (seconds): %.2f",
-                    self.done_places, int(done_time),
+        LOG.warning("Done %d in %.0f @ %.3f per second - %s ETA (seconds): %.2f",
+                    self.done_places, done_time,
                     places_per_sec, self.name, eta)
 
         self.next_info += int(places_per_sec) * self.log_interval
@@ -68,8 +68,8 @@ class ProgressLogger:
             diff_seconds = (rank_end_time - self.rank_start_time).total_seconds()
             places_per_sec = self.done_places / diff_seconds
 
-        LOG.warning("Done %d/%d in %d @ %.3f per second - FINISHED %s\n",
-                    self.done_places, self.total_places, int(diff_seconds),
+        LOG.warning("Done %d/%d in %.0f @ %.3f per second - FINISHED %s\n",
+                    self.done_places, self.total_places, diff_seconds,
                     places_per_sec, self.name)
 
         return self.done_places
diff --git a/src/nominatim_db/paths.py b/src/nominatim_db/paths.py
index 2614fa14..ab34e4c0 100644
--- a/src/nominatim_db/paths.py
+++ b/src/nominatim_db/paths.py
@@ -10,5 +10,6 @@ Path settings for extra data used by Nominatim.
 from pathlib import Path
 
 SQLLIB_DIR = (Path(__file__) / '..' / '..' / '..' / 'lib-sql').resolve()
+LUALIB_DIR = (Path(__file__) / '..' / '..' / '..' / 'lib-lua').resolve()
 DATA_DIR = (Path(__file__) / '..' / '..' / '..' / 'data').resolve()
 CONFIG_DIR = (Path(__file__) / '..' / '..' / '..' / 'settings').resolve()
diff --git a/src/nominatim_db/tokenizer/base.py b/src/nominatim_db/tokenizer/base.py
index 4b96cb23..af2816ec 100644
--- a/src/nominatim_db/tokenizer/base.py
+++ b/src/nominatim_db/tokenizer/base.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Abstract class definitions for tokenizers. These base classes are here
@@ -10,7 +10,6 @@ mainly for documentation purposes.
 """
 from abc import ABC, abstractmethod
 from typing import List, Tuple, Dict, Any, Optional, Iterable
-from pathlib import Path
 
 from ..typing import Protocol
 from ..config import Configuration
@@ -232,6 +231,6 @@ class TokenizerModule(Protocol):
         own tokenizer.
     """
 
-    def create(self, dsn: str, data_dir: Path) -> AbstractTokenizer:
+    def create(self, dsn: str) -> AbstractTokenizer:
         """ Factory for new tokenizers.
         """
diff --git a/src/nominatim_db/tokenizer/factory.py b/src/nominatim_db/tokenizer/factory.py
index 70b2b0be..43b65bae 100644
--- a/src/nominatim_db/tokenizer/factory.py
+++ b/src/nominatim_db/tokenizer/factory.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Functions for creating a tokenizer or initialising the right one for an
@@ -52,19 +52,10 @@ def create_tokenizer(config: Configuration, init_db: bool = True,
     if module_name is None:
         module_name = config.TOKENIZER
 
-    # Create the directory for the tokenizer data
-    assert config.project_dir is not None
-    basedir = config.project_dir / 'tokenizer'
-    if not basedir.exists():
-        basedir.mkdir()
-    elif not basedir.is_dir():
-        LOG.fatal("Tokenizer directory '%s' cannot be created.", basedir)
-        raise UsageError("Tokenizer setup failed.")
-
     # Import and initialize the tokenizer.
     tokenizer_module = _import_tokenizer(module_name)
 
-    tokenizer = tokenizer_module.create(config.get_libpq_dsn(), basedir)
+    tokenizer = tokenizer_module.create(config.get_libpq_dsn())
     tokenizer.init_new_db(config, init_db=init_db)
 
     with connect(config.get_libpq_dsn()) as conn:
@@ -79,12 +70,6 @@ def get_tokenizer_for_db(config: Configuration) -> AbstractTokenizer:
         The function looks up the appropriate tokenizer in the database
         and initialises it.
     """
-    assert config.project_dir is not None
-    basedir = config.project_dir / 'tokenizer'
-    if not basedir.is_dir():
-        # Directory will be repopulated by tokenizer below.
-        basedir.mkdir()
-
     with connect(config.get_libpq_dsn()) as conn:
         name = properties.get_property(conn, 'tokenizer')
 
@@ -94,7 +79,7 @@ def get_tokenizer_for_db(config: Configuration) -> AbstractTokenizer:
 
     tokenizer_module = _import_tokenizer(name)
 
-    tokenizer = tokenizer_module.create(config.get_libpq_dsn(), basedir)
+    tokenizer = tokenizer_module.create(config.get_libpq_dsn())
     tokenizer.init_from_project(config)
 
     return tokenizer
diff --git a/src/nominatim_db/tokenizer/icu_token_analysis.py b/src/nominatim_db/tokenizer/icu_token_analysis.py
index a3cdcb7a..c1ba106c 100644
--- a/src/nominatim_db/tokenizer/icu_token_analysis.py
+++ b/src/nominatim_db/tokenizer/icu_token_analysis.py
@@ -25,6 +25,8 @@ class ICUTokenAnalysis:
 
     def __init__(self, norm_rules: str, trans_rules: str,
                  analysis_rules: Mapping[Optional[str], 'TokenAnalyzerRule']):
+        # additional break signs are not relevant during name analysis
+        norm_rules += ";[[:Space:][-:]]+ > ' ';"
         self.normalizer = Transliterator.createFromRules("icu_normalization",
                                                          norm_rules)
         trans_rules += ";[:Space:]+ > ' '"
diff --git a/src/nominatim_db/tokenizer/icu_tokenizer.py b/src/nominatim_db/tokenizer/icu_tokenizer.py
index 16122d08..3fa867df 100644
--- a/src/nominatim_db/tokenizer/icu_tokenizer.py
+++ b/src/nominatim_db/tokenizer/icu_tokenizer.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tokenizer implementing normalisation as used before Nominatim 4 but using
@@ -12,7 +12,6 @@ from typing import Optional, Sequence, List, Tuple, Mapping, Any, cast, \
                    Dict, Set, Iterable
 import itertools
 import logging
-from pathlib import Path
 
 from psycopg.types.json import Jsonb
 from psycopg import sql as pysql
@@ -38,10 +37,10 @@ WORD_TYPES = (('country_names', 'C'),
               ('housenumbers', 'H'))
 
 
-def create(dsn: str, data_dir: Path) -> 'ICUTokenizer':
+def create(dsn: str) -> 'ICUTokenizer':
     """ Create a new instance of the tokenizer provided by this module.
     """
-    return ICUTokenizer(dsn, data_dir)
+    return ICUTokenizer(dsn)
 
 
 class ICUTokenizer(AbstractTokenizer):
@@ -50,9 +49,8 @@ class ICUTokenizer(AbstractTokenizer):
         normalization routines in Nominatim 3.
     """
 
-    def __init__(self, dsn: str, data_dir: Path) -> None:
+    def __init__(self, dsn: str) -> None:
         self.dsn = dsn
-        self.data_dir = data_dir
         self.loader: Optional[ICURuleLoader] = None
 
     def init_new_db(self, config: Configuration, init_db: bool = True) -> None:
@@ -121,10 +119,10 @@ class ICUTokenizer(AbstractTokenizer):
                            SELECT unnest(nameaddress_vector) as id, count(*)
                                  FROM search_name GROUP BY id)
                   SELECT coalesce(a.id, w.id) as id,
-                         (CASE WHEN w.count is null THEN '{}'::JSONB
+                         (CASE WHEN w.count is null or w.count <= 1 THEN '{}'::JSONB
                               ELSE jsonb_build_object('count', w.count) END
                           ||
-                          CASE WHEN a.count is null THEN '{}'::JSONB
+                          CASE WHEN a.count is null or a.count <= 1 THEN '{}'::JSONB
                               ELSE jsonb_build_object('addr_count', a.count) END) as info
                   FROM word_freq w FULL JOIN addr_freq a ON a.id = w.id;
                   """)
@@ -134,9 +132,10 @@ class ICUTokenizer(AbstractTokenizer):
                 drop_tables(conn, 'tmp_word')
                 cur.execute("""CREATE TABLE tmp_word AS
                                 SELECT word_id, word_token, type, word,
-                                       (CASE WHEN wf.info is null THEN word.info
-                                        ELSE coalesce(word.info, '{}'::jsonb) || wf.info
-                                        END) as info
+                                       coalesce(word.info, '{}'::jsonb)
+                                       - 'count' - 'addr_count' ||
+                                       coalesce(wf.info, '{}'::jsonb)
+                                       as info
                                 FROM word LEFT JOIN word_frequencies wf
                                      ON word.word_id = wf.id
                                 ORDER BY word_id
@@ -382,76 +381,15 @@ class ICUNameAnalyzer(AbstractAnalyzer):
         return postcode.strip().upper()
 
     def update_postcodes_from_db(self) -> None:
-        """ Update postcode tokens in the word table from the location_postcode
-            table.
+        """ Postcode update.
+
+            Removes all postcodes from the word table because they are not
+            needed. Postcodes are recognised by pattern.
         """
         assert self.conn is not None
-        analyzer = self.token_analysis.analysis.get('@postcode')
 
         with self.conn.cursor() as cur:
-            # First get all postcode names currently in the word table.
-            cur.execute("SELECT DISTINCT word FROM word WHERE type = 'P'")
-            word_entries = set((entry[0] for entry in cur))
-
-            # Then compute the required postcode names from the postcode table.
-            needed_entries = set()
-            cur.execute("SELECT country_code, postcode FROM location_postcode")
-            for cc, postcode in cur:
-                info = PlaceInfo({'country_code': cc,
-                                  'class': 'place', 'type': 'postcode',
-                                  'address': {'postcode': postcode}})
-                address = self.sanitizer.process_names(info)[1]
-                for place in address:
-                    if place.kind == 'postcode':
-                        if analyzer is None:
-                            postcode_name = place.name.strip().upper()
-                            variant_base = None
-                        else:
-                            postcode_name = analyzer.get_canonical_id(place)
-                            variant_base = place.get_attr("variant")
-
-                        if variant_base:
-                            needed_entries.add(f'{postcode_name}@{variant_base}')
-                        else:
-                            needed_entries.add(postcode_name)
-                        break
-
-        # Now update the word table.
-        self._delete_unused_postcode_words(word_entries - needed_entries)
-        self._add_missing_postcode_words(needed_entries - word_entries)
-
-    def _delete_unused_postcode_words(self, tokens: Iterable[str]) -> None:
-        assert self.conn is not None
-        if tokens:
-            with self.conn.cursor() as cur:
-                cur.execute("DELETE FROM word WHERE type = 'P' and word = any(%s)",
-                            (list(tokens), ))
-
-    def _add_missing_postcode_words(self, tokens: Iterable[str]) -> None:
-        assert self.conn is not None
-        if not tokens:
-            return
-
-        analyzer = self.token_analysis.analysis.get('@postcode')
-        terms = []
-
-        for postcode_name in tokens:
-            if '@' in postcode_name:
-                term, variant = postcode_name.split('@', 2)
-                term = self._search_normalized(term)
-                if analyzer is None:
-                    variants = [term]
-                else:
-                    variants = analyzer.compute_variants(variant)
-                    if term not in variants:
-                        variants.append(term)
-            else:
-                variants = [self._search_normalized(postcode_name)]
-            terms.append((postcode_name, variants))
-
-        if terms:
-            with self.conn.cursor() as cur:
-                cur.executemany("""SELECT create_postcode_word(%s, %s)""", terms)
+            cur.execute("DELETE FROM word WHERE type = 'P'")
 
     def update_special_phrases(self, phrases: Iterable[Tuple[str, str, str, str]],
                                should_replace: bool) -> None:
@@ -646,10 +584,14 @@ class ICUNameAnalyzer(AbstractAnalyzer):
             if word_id:
                 result = self._cache.housenumbers.get(word_id, result)
                 if result[0] is None:
-                    variants = analyzer.compute_variants(word_id)
+                    varout = analyzer.compute_variants(word_id)
+                    if isinstance(varout, tuple):
+                        variants = varout[0]
+                    else:
+                        variants = varout
                     if variants:
                         hid = execute_scalar(self.conn, "SELECT create_analyzed_hnr_id(%s, %s)",
-                                             (word_id, list(variants)))
+                                             (word_id, variants))
                         result = hid, variants[0]
                         self._cache.housenumbers[word_id] = result
 
@@ -694,13 +636,17 @@ class ICUNameAnalyzer(AbstractAnalyzer):
 
             full, part = self._cache.names.get(token_id, (None, None))
             if full is None:
-                variants = analyzer.compute_variants(word_id)
+                varset = analyzer.compute_variants(word_id)
+                if isinstance(varset, tuple):
+                    variants, lookups = varset
+                else:
+                    variants, lookups = varset, None
                 if not variants:
                     continue
 
                 with self.conn.cursor() as cur:
-                    cur.execute("SELECT * FROM getorcreate_full_word(%s, %s)",
-                                (token_id, variants))
+                    cur.execute("SELECT * FROM getorcreate_full_word(%s, %s, %s)",
+                                (token_id, variants, lookups))
                     full, part = cast(Tuple[int, List[int]], cur.fetchone())
 
                 self._cache.names[token_id] = (full, part)
@@ -719,32 +665,9 @@ class ICUNameAnalyzer(AbstractAnalyzer):
         analyzer = self.token_analysis.analysis.get('@postcode')
 
         if analyzer is None:
-            postcode_name = item.name.strip().upper()
-            variant_base = None
-        else:
-            postcode_name = analyzer.get_canonical_id(item)
-            variant_base = item.get_attr("variant")
-
-        if variant_base:
-            postcode = f'{postcode_name}@{variant_base}'
+            return item.name.strip().upper()
         else:
-            postcode = postcode_name
-
-        if postcode not in self._cache.postcodes:
-            term = self._search_normalized(postcode_name)
-            if not term:
-                return None
-
-            variants = {term}
-            if analyzer is not None and variant_base:
-                variants.update(analyzer.compute_variants(variant_base))
-
-            with self.conn.cursor() as cur:
-                cur.execute("SELECT create_postcode_word(%s, %s)",
-                            (postcode, list(variants)))
-            self._cache.postcodes.add(postcode)
-
-        return postcode_name
+            return analyzer.get_canonical_id(item)
 
 
 class _TokenInfo:
@@ -837,5 +760,4 @@ class _TokenCache:
         self.names: Dict[str, Tuple[int, List[int]]] = {}
         self.partials: Dict[str, int] = {}
         self.fulls: Dict[str, List[int]] = {}
-        self.postcodes: Set[str] = set()
         self.housenumbers: Dict[str, Tuple[Optional[int], Optional[str]]] = {}
diff --git a/src/nominatim_db/tokenizer/token_analysis/base.py b/src/nominatim_db/tokenizer/token_analysis/base.py
index 52ee8013..186f1d3e 100644
--- a/src/nominatim_db/tokenizer/token_analysis/base.py
+++ b/src/nominatim_db/tokenizer/token_analysis/base.py
@@ -7,7 +7,7 @@
 """
 Common data types and protocols for analysers.
 """
-from typing import Mapping, List, Any
+from typing import Mapping, List, Any, Union, Tuple
 
 from ...typing import Protocol
 from ...data.place_name import PlaceName
@@ -33,7 +33,7 @@ class Analyzer(Protocol):
                     for example because the character set in use does not match.
         """
 
-    def compute_variants(self, canonical_id: str) -> List[str]:
+    def compute_variants(self, canonical_id: str) -> Union[List[str], Tuple[List[str], List[str]]]:
         """ Compute the transliterated spelling variants for the given
             canonical ID.
 
diff --git a/src/nominatim_db/tokenizer/token_analysis/generic.py b/src/nominatim_db/tokenizer/token_analysis/generic.py
index 4aa84de7..b01cebf7 100644
--- a/src/nominatim_db/tokenizer/token_analysis/generic.py
+++ b/src/nominatim_db/tokenizer/token_analysis/generic.py
@@ -2,20 +2,19 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Generic processor for names that creates abbreviation variants.
 """
-from typing import Mapping, Dict, Any, Iterable, Iterator, Optional, List, cast
+from typing import Mapping, Dict, Any, Iterable, Optional, List, cast, Tuple
 import itertools
 
-import datrie
-
 from ...errors import UsageError
 from ...data.place_name import PlaceName
 from .config_variants import get_variant_config
 from .generic_mutation import MutationVariantGenerator
+from .simple_trie import SimpleTrie
 
 # Configuration section
 
@@ -25,8 +24,7 @@ def configure(rules: Mapping[str, Any], normalizer: Any, _: Any) -> Dict[str, An
     """
     config: Dict[str, Any] = {}
 
-    config['replacements'], config['chars'] = get_variant_config(rules.get('variants'),
-                                                                 normalizer)
+    config['replacements'], _ = get_variant_config(rules.get('variants'), normalizer)
     config['variant_only'] = rules.get('mode', '') == 'variant-only'
 
     # parse mutation rules
@@ -68,12 +66,8 @@ class GenericTokenAnalysis:
         self.variant_only = config['variant_only']
 
         # Set up datrie
-        if config['replacements']:
-            self.replacements = datrie.Trie(config['chars'])
-            for src, repllist in config['replacements']:
-                self.replacements[src] = repllist
-        else:
-            self.replacements = None
+        self.replacements: Optional[SimpleTrie[List[str]]] = \
+            SimpleTrie(config['replacements']) if config['replacements'] else None
 
         # set up mutation rules
         self.mutations = [MutationVariantGenerator(*cfg) for cfg in config['mutations']]
@@ -84,7 +78,7 @@ class GenericTokenAnalysis:
         """
         return cast(str, self.norm.transliterate(name.name)).strip()
 
-    def compute_variants(self, norm_name: str) -> List[str]:
+    def compute_variants(self, norm_name: str) -> Tuple[List[str], List[str]]:
         """ Compute the spelling variants for the given normalized name
             and transliterate the result.
         """
@@ -93,18 +87,20 @@ class GenericTokenAnalysis:
         for mutation in self.mutations:
             variants = mutation.generate(variants)
 
-        return [name for name in self._transliterate_unique_list(norm_name, variants) if name]
-
-    def _transliterate_unique_list(self, norm_name: str,
-                                   iterable: Iterable[str]) -> Iterator[Optional[str]]:
-        seen = set()
+        varset = set(map(str.strip, variants))
         if self.variant_only:
-            seen.add(norm_name)
+            varset.discard(norm_name)
+
+        trans = []
+        norm = []
+
+        for var in varset:
+            t = self.to_ascii.transliterate(var).strip()
+            if t:
+                trans.append(t)
+                norm.append(var)
 
-        for variant in map(str.strip, iterable):
-            if variant not in seen:
-                seen.add(variant)
-                yield self.to_ascii.transliterate(variant).strip()
+        return trans, norm
 
     def _generate_word_variants(self, norm_name: str) -> Iterable[str]:
         baseform = '^ ' + norm_name + ' ^'
@@ -116,10 +112,10 @@ class GenericTokenAnalysis:
             pos = 0
             force_space = False
             while pos < baselen:
-                full, repl = self.replacements.longest_prefix_item(baseform[pos:],
-                                                                   (None, None))
-                if full is not None:
-                    done = baseform[startpos:pos]
+                frm = pos
+                repl, pos = self.replacements.longest_prefix(baseform, pos)
+                if repl is not None:
+                    done = baseform[startpos:frm]
                     partials = [v + done + r
                                 for v, r in itertools.product(partials, repl)
                                 if not force_space or r.startswith(' ')]
@@ -128,11 +124,10 @@ class GenericTokenAnalysis:
                         # to be helpful. Only use the original term.
                         startpos = 0
                         break
-                    startpos = pos + len(full)
-                    if full[-1] == ' ':
-                        startpos -= 1
+                    if baseform[pos - 1] == ' ':
+                        pos -= 1
                         force_space = True
-                    pos = startpos
+                    startpos = pos
                 else:
                     pos += 1
                     force_space = False
diff --git a/src/nominatim_db/tokenizer/token_analysis/simple_trie.py b/src/nominatim_db/tokenizer/token_analysis/simple_trie.py
new file mode 100644
index 00000000..c86551df
--- /dev/null
+++ b/src/nominatim_db/tokenizer/token_analysis/simple_trie.py
@@ -0,0 +1,84 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Simple dict-based implementation of a trie structure.
+"""
+from typing import TypeVar, Generic, Tuple, Optional, List, Dict
+from collections import defaultdict
+
+T = TypeVar('T')
+
+
+class SimpleTrie(Generic[T]):
+    """ A simple read-only trie structure.
+        This structure supports exactly one lookup operation,
+        which is longest-prefix lookup.
+    """
+
+    def __init__(self, data: Optional[List[Tuple[str, T]]] = None) -> None:
+        self._tree: Dict[str, 'SimpleTrie[T]'] = defaultdict(SimpleTrie[T])
+        self._value: Optional[T] = None
+        self._prefix = ''
+
+        if data:
+            for key, value in data:
+                self._add(key, 0, value)
+
+            self._make_compact()
+
+    def _add(self, word: str, pos: int, value: T) -> None:
+        """ (Internal) Add a sub-word to the trie.
+            The word is added from index 'pos'. If the sub-word to add
+            is empty, then the trie saves the given value.
+        """
+        if pos < len(word):
+            self._tree[word[pos]]._add(word, pos + 1, value)
+        else:
+            self._value = value
+
+    def _make_compact(self) -> None:
+        """ (Internal) Compress tree where there is exactly one subtree
+            and no value.
+
+            Compression works recursively starting at the leaf.
+        """
+        for t in self._tree.values():
+            t._make_compact()
+
+        if len(self._tree) == 1 and self._value is None:
+            assert not self._prefix
+            for k, v in self._tree.items():
+                self._prefix = k + v._prefix
+                self._tree = v._tree
+                self._value = v._value
+
+    def longest_prefix(self, word: str, start: int = 0) -> Tuple[Optional[T], int]:
+        """ Return the longest prefix match for the given word starting at
+            the position 'start'.
+
+            The function returns a tuple with the value for the longest match and
+            the position of the word after the match. If no match was found at
+            all, the function returns (None, start).
+        """
+        cur = self
+        pos = start
+        result: Tuple[Optional[T], int] = None, start
+
+        while True:
+            if cur._prefix:
+                if not word.startswith(cur._prefix, pos):
+                    return result
+                pos += len(cur._prefix)
+
+            if cur._value:
+                result = cur._value, pos
+
+            if pos >= len(word) or word[pos] not in cur._tree:
+                return result
+
+            cur = cur._tree[word[pos]]
+            pos += 1
diff --git a/src/nominatim_db/tools/database_import.py b/src/nominatim_db/tools/database_import.py
index a7ee807e..809a8839 100644
--- a/src/nominatim_db/tools/database_import.py
+++ b/src/nominatim_db/tools/database_import.py
@@ -127,7 +127,7 @@ def import_osm_data(osm_files: Union[Path, Sequence[Path]],
                 fsize += os.stat(str(fname)).st_size
         else:
             fsize = os.stat(str(osm_files)).st_size
-        options['osm2pgsql_cache'] = int(min((mem.available + mem.cached) * 0.75,
+        options['osm2pgsql_cache'] = int(min((mem.available + getattr(mem, 'cached', 0)) * 0.75,
                                              fsize * 2) / 1024 / 1024) + 1
 
     run_osm2pgsql(options)
diff --git a/src/nominatim_db/tools/exec_utils.py b/src/nominatim_db/tools/exec_utils.py
index fc3a7465..2d048bcb 100644
--- a/src/nominatim_db/tools/exec_utils.py
+++ b/src/nominatim_db/tools/exec_utils.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Helper functions for executing external programs.
@@ -39,7 +39,10 @@ def run_osm2pgsql(options: Mapping[str, Any]) -> None:
 
     if str(options['osm2pgsql_style']).endswith('.lua'):
         env['LUA_PATH'] = ';'.join((str(options['osm2pgsql_style_path'] / '?.lua'),
-                                    os.environ.get('LUAPATH', ';')))
+                                    os.environ.get('LUA_PATH', ';')))
+        env['THEMEPARK_PATH'] = str(options['osm2pgsql_style_path'] / 'themes')
+        if 'THEMEPARK_PATH' in os.environ:
+            env['THEMEPARK_PATH'] += ':' + os.environ['THEMEPARK_PATH']
         cmd.extend(('--output', 'flex'))
 
         for flavour in ('data', 'index'):
@@ -82,7 +85,7 @@ def _mk_tablespace_options(ttype: str, options: Mapping[str, Any]) -> List[str]:
 
 
 def _find_osm2pgsql_cmd(cmdline: Optional[str]) -> str:
-    if cmdline is not None:
+    if cmdline:
         return cmdline
 
     in_path = shutil.which('osm2pgsql')
diff --git a/src/nominatim_db/tools/postcodes.py b/src/nominatim_db/tools/postcodes.py
index 4763aa03..64427f41 100644
--- a/src/nominatim_db/tools/postcodes.py
+++ b/src/nominatim_db/tools/postcodes.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Functions for importing, updating and otherwise maintaining the table
@@ -64,11 +64,15 @@ class _PostcodeCollector:
             if normalized:
                 self.collected[normalized] += (x, y)
 
-    def commit(self, conn: Connection, analyzer: AbstractAnalyzer, project_dir: Path) -> None:
-        """ Update postcodes for the country from the postcodes selected so far
-            as well as any externally supplied postcodes.
+    def commit(self, conn: Connection, analyzer: AbstractAnalyzer,
+               project_dir: Optional[Path]) -> None:
+        """ Update postcodes for the country from the postcodes selected so far.
+
+            When 'project_dir' is set, then any postcode files found in this
+            directory are taken into account as well.
         """
-        self._update_from_external(analyzer, project_dir)
+        if project_dir is not None:
+            self._update_from_external(analyzer, project_dir)
         to_add, to_delete, to_update = self._compute_changes(conn)
 
         LOG.info("Processing country '%s' (%s added, %s deleted, %s updated).",
@@ -170,7 +174,7 @@ class _PostcodeCollector:
         return None
 
 
-def update_postcodes(dsn: str, project_dir: Path, tokenizer: AbstractTokenizer) -> None:
+def update_postcodes(dsn: str, project_dir: Optional[Path], tokenizer: AbstractTokenizer) -> None:
     """ Update the table of artificial postcodes.
 
         Computes artificial postcode centroids from the placex table,
diff --git a/src/nominatim_db/tools/special_phrases/sp_importer.py b/src/nominatim_db/tools/special_phrases/sp_importer.py
index 40b089a7..ac50377f 100644
--- a/src/nominatim_db/tools/special_phrases/sp_importer.py
+++ b/src/nominatim_db/tools/special_phrases/sp_importer.py
@@ -16,7 +16,6 @@
 from typing import Iterable, Tuple, Mapping, Sequence, Optional, Set
 import logging
 import re
-
 from psycopg.sql import Identifier, SQL
 
 from ...typing import Protocol
@@ -65,6 +64,29 @@ class SPImporter():
         # special phrases class/type on the wiki.
         self.table_phrases_to_delete: Set[str] = set()
 
+    def get_classtype_pairs(self, min: int = 0) -> Set[Tuple[str, str]]:
+        """
+            Returns list of allowed special phrases from the database,
+            restricting to a list of combinations of classes and types
+            which occur more than a specified amount of times.
+
+            Default value for this, if not specified, is at least once.
+        """
+        db_combinations = set()
+        query = f"""
+        SELECT class AS CLS, type AS typ
+        FROM placex
+        GROUP BY class, type
+        HAVING COUNT(*) > {min}
+        """
+
+        with self.db_connection.cursor() as db_cursor:
+            db_cursor.execute(SQL(query))
+            for row in db_cursor:
+                db_combinations.add((row[0], row[1]))
+
+        return db_combinations
+
     def import_phrases(self, tokenizer: AbstractTokenizer, should_replace: bool) -> None:
         """
             Iterate through all SpecialPhrases extracted from the
@@ -88,6 +110,7 @@ class SPImporter():
         self._create_classtype_table_and_indexes(class_type_pairs)
         if should_replace:
             self._remove_non_existent_tables_from_db()
+
         self.db_connection.commit()
 
         with tokenizer.name_analyzer() as analyzer:
@@ -177,10 +200,17 @@ class SPImporter():
         with self.db_connection.cursor() as db_cursor:
             db_cursor.execute("CREATE INDEX idx_placex_classtype ON placex (class, type)")
 
+        allowed_special_phrases = self.get_classtype_pairs()
+
         for pair in class_type_pairs:
             phrase_class = pair[0]
             phrase_type = pair[1]
 
+            if (phrase_class, phrase_type) not in allowed_special_phrases:
+                LOG.warning("Skipping phrase %s=%s: not in allowed special phrases",
+                            phrase_class, phrase_type)
+                continue
+
             table_name = _classtype_table(phrase_class, phrase_type)
 
             if table_name in self.table_phrases_to_delete:
diff --git a/src/nominatim_db/tools/tiger_data.py b/src/nominatim_db/tools/tiger_data.py
index 85110ae5..7b865570 100644
--- a/src/nominatim_db/tools/tiger_data.py
+++ b/src/nominatim_db/tools/tiger_data.py
@@ -108,8 +108,7 @@ async def add_tiger_data(data_dir: str, config: Configuration, threads: int,
 
         async with QueryPool(dsn, place_threads, autocommit=True) as pool:
             with tokenizer.name_analyzer() as analyzer:
-                lines = 0
-                for row in tar:
+                for lineno, row in enumerate(tar, 1):
                     try:
                         address = dict(street=row['street'], postcode=row['postcode'])
                         args = ('SRID=4326;' + row['geometry'],
@@ -124,10 +123,8 @@ async def add_tiger_data(data_dir: str, config: Configuration, threads: int,
                                                     %s::INT, %s::TEXT, %s::JSONB, %s::TEXT)""",
                         args)
 
-                    lines += 1
-                    if lines == 1000:
+                    if not lineno % 1000:
                         print('.', end='', flush=True)
-                    lines = 0
 
         print('', flush=True)
 
diff --git a/src/nominatim_db/utils/centroid.py b/src/nominatim_db/utils/centroid.py
index a45d958b..02512336 100644
--- a/src/nominatim_db/utils/centroid.py
+++ b/src/nominatim_db/utils/centroid.py
@@ -30,8 +30,8 @@ class PointsCentroid:
         if self.count == 0:
             raise ValueError("No points available for centroid.")
 
-        return (float(self.sum_x/self.count)/10000000,
-                float(self.sum_y/self.count)/10000000)
+        return (self.sum_x / self.count / 10_000_000,
+                self.sum_y / self.count / 10_000_000)
 
     def __len__(self) -> int:
         return self.count
@@ -40,8 +40,8 @@ class PointsCentroid:
         if isinstance(other, Collection) and len(other) == 2:
             if all(isinstance(p, (float, int)) for p in other):
                 x, y = other
-                self.sum_x += int(x * 10000000)
-                self.sum_y += int(y * 10000000)
+                self.sum_x += int(x * 10_000_000)
+                self.sum_y += int(y * 10_000_000)
                 self.count += 1
                 return self
 
diff --git a/src/nominatim_db/version.py b/src/nominatim_db/version.py
index 75f2b7d6..070417e3 100644
--- a/src/nominatim_db/version.py
+++ b/src/nominatim_db/version.py
@@ -55,7 +55,7 @@ def parse_version(version: str) -> NominatimVersion:
     return NominatimVersion(*[int(x) for x in parts[:2] + parts[2].split('-')])
 
 
-NOMINATIM_VERSION = parse_version('4.5.0-0')
+NOMINATIM_VERSION = parse_version('5.1.0-0')
 
 POSTGRESQL_REQUIRED_VERSION = (12, 0)
 POSTGIS_REQUIRED_VERSION = (3, 0)
diff --git a/test/Makefile b/test/Makefile
deleted file mode 100644
index 9768ebd7..00000000
--- a/test/Makefile
+++ /dev/null
@@ -1,10 +0,0 @@
-all: bdd python
-
-bdd:
-	cd bdd && behave -DREMOVE_TEMPLATE=1
-
-python:
-	pytest python
-
-
-.PHONY: bdd python
diff --git a/test/bdd/.behaverc b/test/bdd/.behaverc
deleted file mode 100644
index 1b426ec9..00000000
--- a/test/bdd/.behaverc
+++ /dev/null
@@ -1,3 +0,0 @@
-[behave]
-show_skipped=False
-default_tags=~@Fail
diff --git a/test/bdd/api/details/language.feature b/test/bdd/api/details/language.feature
deleted file mode 100644
index 5351ce41..00000000
--- a/test/bdd/api/details/language.feature
+++ /dev/null
@@ -1,63 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Localization of search results
-
-    Scenario: default language
-        When sending details query for R1155955
-        Then results contain
-          | ID | localname |
-          | 0  | Liechtenstein |
-
-    Scenario: accept-language first
-        When sending details query for R1155955
-          | accept-language |
-          | zh,de |
-        Then results contain
-          | ID | localname |
-          | 0  | 列支敦士登 |
-
-    Scenario: accept-language missing
-        When sending details query for R1155955
-          | accept-language |
-          | xx,fr,en,de |
-        Then results contain
-          | ID | localname |
-          | 0  | Liechtenstein |
-
-    Scenario: http accept language header first
-        Given the HTTP header
-          | accept-language |
-          | fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending details query for R1155955
-        Then results contain
-          | ID | localname |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header and accept-language
-        Given the HTTP header
-          | accept-language |
-          | fr-ca,fr;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending details query for R1155955
-          | accept-language |
-          | fo,en |
-        Then results contain
-          | ID | localname |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header fallback
-        Given the HTTP header
-          | accept-language |
-          | fo-ca,en-ca;q=0.5 |
-        When sending details query for R1155955
-        Then results contain
-          | ID | localname |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header fallback (upper case)
-        Given the HTTP header
-          | accept-language |
-          | fo-FR;q=0.8,en-ca;q=0.5 |
-        When sending details query for R1155955
-        Then results contain
-          | ID | localname |
-          | 0  | Liktinstein |
diff --git a/test/bdd/api/details/params.feature b/test/bdd/api/details/params.feature
deleted file mode 100644
index 0fb64171..00000000
--- a/test/bdd/api/details/params.feature
+++ /dev/null
@@ -1,96 +0,0 @@
-@APIDB
-Feature: Object details
-    Testing different parameter options for details API.
-
-    @SQLITE
-    Scenario: JSON Details
-        When sending json details query for W297699560
-        Then the result is valid json
-        And result has attributes geometry
-        And result has not attributes keywords,address,linked_places,parentof
-        And results contain in field geometry
-            | type  |
-            | Point |
-
-    @SQLITE
-    Scenario: JSON Details with pretty printing
-        When sending json details query for W297699560
-            | pretty |
-            | 1      |
-        Then the result is valid json
-        And result has attributes geometry
-        And result has not attributes keywords,address,linked_places,parentof
-
-    @SQLITE
-     Scenario: JSON Details with addressdetails
-        When sending json details query for W297699560
-            | addressdetails |
-            | 1 |
-        Then the result is valid json
-        And result has attributes address
-
-    @SQLITE
-    Scenario: JSON Details with linkedplaces
-        When sending json details query for R123924
-            | linkedplaces |
-            | 1 |
-        Then the result is valid json
-        And result has attributes linked_places
-
-    @SQLITE
-    Scenario: JSON Details with hierarchy
-        When sending json details query for W297699560
-            | hierarchy |
-            | 1 |
-        Then the result is valid json
-        And result has attributes hierarchy
-
-    @SQLITE
-    Scenario: JSON Details with grouped hierarchy
-        When sending json details query for W297699560
-            | hierarchy | group_hierarchy |
-            | 1         | 1 |
-        Then the result is valid json
-        And result has attributes hierarchy
-
-     Scenario Outline: JSON Details with keywords
-        When sending json details query for <osmid>
-            | keywords |
-            | 1 |
-        Then the result is valid json
-        And result has attributes keywords
-
-    Examples:
-            | osmid |
-            | W297699560 |
-            | W243055645 |
-            | W243055716 |
-            | W43327921  |
-
-    # ticket #1343
-    Scenario: Details of a country with keywords
-        When sending details query for R1155955
-            | keywords |
-            | 1 |
-        Then the result is valid json
-        And result has attributes keywords
-
-    @SQLITE
-    Scenario Outline: JSON details with full geometry
-        When sending json details query for <osmid>
-            | polygon_geojson |
-            | 1 |
-        Then the result is valid json
-        And result has attributes geometry
-        And results contain in field geometry
-            | type       |
-            | <geometry> |
-
-    Examples:
-            | osmid      | geometry   |
-            | W297699560 | LineString |
-            | W243055645 | Polygon    |
-            | W243055716 | Polygon    |
-            | W43327921  | LineString |
-
-
diff --git a/test/bdd/api/details/simple.feature b/test/bdd/api/details/simple.feature
deleted file mode 100644
index 5e0bacc5..00000000
--- a/test/bdd/api/details/simple.feature
+++ /dev/null
@@ -1,82 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Object details
-    Check details page for correctness
-
-    Scenario Outline: Details via OSM id
-        When sending details query for <type><id>
-        Then the result is valid json
-        And results contain
-            | osm_type | osm_id |
-            | <type>   | <id> |
-
-    Examples:
-     | type | id |
-     | N    | 5484325405 |
-     | W    | 43327921 |
-     | R    | 123924 |
-
-
-    Scenario Outline: Details for different class types for the same OSM id
-        When sending details query for N300209696:<class>
-        Then the result is valid json
-        And results contain
-          | osm_type | osm_id    | category |
-          | N        | 300209696 | <class> |
-
-    Examples:
-     | class |
-     | tourism |
-     | natural |
-     | mountain_pass |
-
-
-    Scenario Outline: Details via unknown OSM id
-        When sending details query for <object>
-        Then a HTTP 404 is returned
-
-    Examples:
-      | object |
-      | 1 |
-      | R1 |
-      | N300209696:highway |
-
-
-     Scenario: Details for interpolation way return the interpolation
-        When sending details query for W1
-        Then the result is valid json
-        And results contain
-            | category | type   | osm_type | osm_id | admin_level |
-            | place    | houses | W        | 1      | 15          |
-
-
-     @Fail
-     Scenario: Details for interpolation way return the interpolation
-        When sending details query for 112871
-        Then the result is valid json
-        And results contain
-            | category | type   | admin_level |
-            | place    | houses | 15          |
-        And result has not attributes osm_type,osm_id
-
-
-     @Fail
-     Scenario: Details for interpolation way return the interpolation
-        When sending details query for 112820
-        Then the result is valid json
-        And results contain
-            | category | type     | admin_level |
-            | place    | postcode | 15          |
-        And result has not attributes osm_type,osm_id
-
-
-    Scenario Outline: Details debug output returns no errors
-        When sending debug details query for <feature>
-        Then the result is valid html
-
-        Examples:
-          | feature     |
-          | N5484325405 |
-          | W1          |
-          | 112820      |
-          | 112871      |
diff --git a/test/bdd/api/errors/formats.feature b/test/bdd/api/errors/formats.feature
deleted file mode 100644
index e279a8fa..00000000
--- a/test/bdd/api/errors/formats.feature
+++ /dev/null
@@ -1,14 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Places by osm_type and osm_id Tests
-    Simple tests for errors in various response formats.
-
-    Scenario Outline: Force error by providing too many ids
-        When sending <format> lookup query for N1,N2,N3,N4,N5,N6,N7,N8,N9,N10,N11,N12,N13,N14,N15,N16,N17,N18,N19,N20,N21,N22,N23,N24,N25,N26,N27,N28,N29,N30,N31,N32,N33,N34,N35,N36,N37,N38,N39,N40,N41,N42,N43,N44,N45,N46,N47,N48,N49,N50,N51
-        Then a <format> user error is returned
-
-    Examples:
-        | format  |
-        | xml     |
-        | json    |
-        | geojson |
diff --git a/test/bdd/api/lookup/simple.feature b/test/bdd/api/lookup/simple.feature
deleted file mode 100644
index 1e5b8ee7..00000000
--- a/test/bdd/api/lookup/simple.feature
+++ /dev/null
@@ -1,42 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Places by osm_type and osm_id Tests
-    Simple tests for response format.
-
-    Scenario Outline: address lookup for existing node, way, relation
-        When sending <format> lookup query for N5484325405,W43327921,,R123924,X99,N0
-        Then the result is valid <outformat>
-        And exactly 3 results are returned
-
-    Examples:
-        | format      | outformat   |
-        | xml         | xml         |
-        | json        | json        |
-        | jsonv2      | json        |
-        | geojson     | geojson     |
-        | geocodejson | geocodejson |
-
-    Scenario: address lookup for non-existing or invalid node, way, relation
-        When sending xml lookup query for X99,,N0,nN158845944,ABC,,W9
-        Then exactly 0 results are returned
-
-    Scenario Outline: Boundingbox is returned
-        When sending <format> lookup query for N5484325405,W43327921
-        Then exactly 2 results are returned
-        And result 0 has bounding box in 47.135,47.14,9.52,9.525
-        And result 1 has bounding box in 47.07,47.08,9.50,9.52
-
-    Examples:
-      | format |
-      | json |
-      | jsonv2 |
-      | geojson |
-      | xml |
-
-
-    Scenario: Lookup of a linked place
-        When sending geocodejson lookup query for N1932181216
-        Then exactly 1 result is returned
-        And results contain
-          | name  |
-          | Vaduz |
diff --git a/test/bdd/api/reverse/geometry.feature b/test/bdd/api/reverse/geometry.feature
deleted file mode 100644
index aac82807..00000000
--- a/test/bdd/api/reverse/geometry.feature
+++ /dev/null
@@ -1,45 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Geometries for reverse geocoding
-    Tests for returning geometries with reverse
-
-
-    Scenario: Polygons are returned fully by default
-        When sending v1/reverse at 47.13803,9.52264
-          | polygon_text |
-          | 1            |
-        Then results contain
-          | geotext |
-          | ^POLYGON\(\(9.5225302 47.138066, ?9.5225348 47.1379282, ?9.5226142 47.1379294, ?9.5226143 47.1379257, ?9.522615 47.137917, ?9.5226225 47.1379098, ?9.5226334 47.1379052, ?9.5226461 47.1379037, ?9.5226588 47.1379056, ?9.5226693 47.1379107, ?9.5226762 47.1379181, ?9.5226762 47.1379268, ?9.5226761 47.1379308, ?9.5227366 47.1379317, ?9.5227352 47.1379753, ?9.5227608 47.1379757, ?9.5227595 47.1380148, ?9.5227355 47.1380145, ?9.5227337 47.1380692, ?9.5225302 47.138066\)\) |
-
-
-    Scenario: Polygons can be slightly simplified
-        When sending v1/reverse at 47.13803,9.52264
-          | polygon_text | polygon_threshold |
-          | 1            | 0.00001            |
-        Then results contain
-          | geotext |
-          | ^POLYGON\(\(9.5225302 47.138066, ?9.5225348 47.1379282, ?9.5226142 47.1379294, ?9.5226225 47.1379098, ?9.5226588 47.1379056, ?9.5226761 47.1379308, ?9.5227366 47.1379317, ?9.5227352 47.1379753, ?9.5227608 47.1379757, ?9.5227595 47.1380148, ?9.5227355 47.1380145, ?9.5227337 47.1380692, ?9.5225302 47.138066\)\) |
-
-
-    Scenario: Polygons can be much simplified
-        When sending v1/reverse at 47.13803,9.52264
-          | polygon_text | polygon_threshold |
-          | 1            | 0.9               |
-        Then results contain
-          | geotext |
-          | ^POLYGON\(\([0-9. ]+, ?[0-9. ]+, ?[0-9. ]+, ?[0-9. ]+(, ?[0-9. ]+)?\)\) |
-
-
-    Scenario: For polygons return the centroid as center point
-        When sending v1/reverse at 47.13836,9.52304
-        Then results contain
-          | centroid               |
-          | 9.52271080 47.13818045 |
-
-
-    Scenario: For streets return the closest point as center point
-        When sending v1/reverse at 47.13368,9.52942
-        Then results contain
-          | centroid    |
-          | 9.529431527 47.13368172 |
diff --git a/test/bdd/api/reverse/language.feature b/test/bdd/api/reverse/language.feature
deleted file mode 100644
index 69f84ebc..00000000
--- a/test/bdd/api/reverse/language.feature
+++ /dev/null
@@ -1,37 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Localization of reverse search results
-
-    Scenario: default language
-        When sending v1/reverse at 47.14,9.55
-        Then result addresses contain
-          | ID | country |
-          | 0  | Liechtenstein |
-
-    Scenario: accept-language parameter
-        When sending v1/reverse at 47.14,9.55
-          | accept-language |
-          | ja,en |
-        Then result addresses contain
-          | ID | country |
-          | 0  | リヒテンシュタイン |
-
-    Scenario: HTTP accept language header
-        Given the HTTP header
-          | accept-language |
-          | fo-ca,fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending v1/reverse at 47.14,9.55
-        Then result addresses contain
-          | ID | country |
-          | 0  | Liktinstein |
-
-    Scenario: accept-language parameter and HTTP header
-        Given the HTTP header
-          | accept-language |
-          | fo-ca,fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending v1/reverse at 47.14,9.55
-          | accept-language |
-          | en |
-        Then result addresses contain
-          | ID | country |
-          | 0  | Liechtenstein |
diff --git a/test/bdd/api/reverse/queries.feature b/test/bdd/api/reverse/queries.feature
deleted file mode 100644
index f154b18d..00000000
--- a/test/bdd/api/reverse/queries.feature
+++ /dev/null
@@ -1,113 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Reverse geocoding
-    Testing the reverse function
-
-    Scenario Outline: Simple reverse-geocoding with no results
-        When sending v1/reverse at <lat>,<lon>
-        Then exactly 0 results are returned
-
-    Examples:
-     | lat      | lon |
-     | 0.0      | 0.0 |
-     | -34.830  | -56.105 |
-     | 45.174   | -103.072 |
-     | 21.156   | -12.2744 |
-     | 91.3     | 0.4    |
-     | -700     | 0.4    |
-     | 0.2      | 324.44 |
-     | 0.2      | -180.4 |
-
-
-    @Tiger
-    Scenario: TIGER house number
-        When sending v1/reverse at 32.4752389363,-86.4810198619
-        Then results contain
-          | category | type |
-          | place    | house |
-        And result addresses contain
-          | house_number | road                | postcode | country_code |
-          | 707          | Upper Kingston Road | 36067    | us |
-
-    @Tiger
-    Scenario: No TIGER house number for zoom < 18
-        When sending v1/reverse at 32.4752389363,-86.4810198619
-          | zoom |
-          | 17 |
-        Then results contain
-          | osm_type | category |
-          | way      | highway  |
-        And result addresses contain
-          | road                | postcode | country_code |
-          | Upper Kingston Road | 36067    | us |
-
-    Scenario: Interpolated house number
-        When sending v1/reverse at 47.118533,9.57056562
-        Then results contain
-          | osm_type | category | type |
-          | way      | place    | house |
-        And result addresses contain
-          | house_number | road |
-          | 1019         | Grosssteg |
-
-    Scenario: Address with non-numerical house number
-        When sending v1/reverse at 47.107465,9.52838521614
-        Then result addresses contain
-          | house_number | road |
-          | 39A/B        | Dorfstrasse |
-
-
-    Scenario: Address with numerical house number
-        When sending v1/reverse at 47.168440329479594,9.511551699184338
-        Then result addresses contain
-          | house_number | road |
-          | 6            | Schmedgässle |
-
-    Scenario Outline: Zoom levels below 5 result in country
-        When sending v1/reverse at 47.16,9.51
-         | zoom |
-         | <zoom> |
-        Then results contain
-         | display_name |
-         | Liechtenstein |
-
-    Examples:
-         | zoom |
-         | 0    |
-         | 1    |
-         | 2    |
-         | 3    |
-         | 4    |
-
-    Scenario: When on a street, the closest interpolation is shown
-        When sending v1/reverse at 47.118457166193245,9.570678289621355
-         | zoom |
-         | 18 |
-        Then results contain
-         | display_name |
-         | 1021, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-
-    # github 2214
-    Scenario: Interpolations do not override house numbers when they are closer
-        When sending v1/reverse at 47.11778,9.57255
-         | zoom |
-         | 18 |
-        Then results contain
-         | display_name |
-         | 5, Grosssteg, Steg, Triesenberg, Oberland, 9497, Liechtenstein |
-
-    Scenario: Interpolations do not override house numbers when they are closer (2)
-        When sending v1/reverse at 47.11834,9.57167
-         | zoom |
-         | 18 |
-        Then results contain
-         | display_name |
-         | 3, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-
-    Scenario: When on a street with zoom 18, the closest housenumber is returned
-        When sending v1/reverse at 47.11755503977281,9.572722250405036
-         | zoom |
-         | 18 |
-        Then result addresses contain
-         | house_number |
-         | 7 |
diff --git a/test/bdd/api/reverse/v1_geocodejson.feature b/test/bdd/api/reverse/v1_geocodejson.feature
deleted file mode 100644
index 56b85e20..00000000
--- a/test/bdd/api/reverse/v1_geocodejson.feature
+++ /dev/null
@@ -1,107 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Geocodejson for Reverse API
-    Testing correctness of geocodejson output (API version v1).
-
-    Scenario Outline: Simple OSM result
-        When sending v1/reverse at 47.066,9.504 with format geocodejson
-          | addressdetails |
-          | <has_address>  |
-        Then result has attributes place_id, accuracy
-        And result has <attributes> country,postcode,county,city,district,street,housenumber, admin
-        Then results contain
-          | osm_type | osm_id     | osm_key | osm_value | type  |
-          | node     | 6522627624 | shop    | bakery    | house |
-        And results contain
-          | name                  | label |
-          | Dorfbäckerei Herrmann | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
-        And results contain in field geojson
-          | type  | coordinates             |
-          | Point | [9.5036065, 47.0660892] |
-        And results contain in field __geocoding
-          | version | licence | attribution |
-          | 0.1.0   | ODbL    | ^Data © OpenStreetMap contributors, ODbL 1.0. https?://osm.org/copyright$ |
-
-        Examples:
-          | has_address | attributes     |
-          | 1           | attributes     |
-          | 0           | not attributes |
-
-
-    Scenario: City housenumber-level address with street
-        When sending v1/reverse at 47.1068011,9.52810091 with format geocodejson
-        Then results contain
-          | housenumber | street    | postcode | city    | country |
-          | 8           | Im Winkel | 9495     | Triesen | Liechtenstein |
-         And results contain in field admin
-          | level6   | level8  |
-          | Oberland | Triesen |
-
-
-    Scenario: Town street-level address with street
-        When sending v1/reverse at 47.066,9.504 with format geocodejson
-          | zoom |
-          | 16 |
-        Then results contain
-          | name    | city    | postcode | country |
-          | Gnetsch | Balzers | 9496     | Liechtenstein |
-
-
-    Scenario: Poi street-level address with footway
-        When sending v1/reverse at 47.06515,9.50083 with format geocodejson
-        Then results contain
-          | street  | city    | postcode | country |
-          | Burgweg | Balzers | 9496     | Liechtenstein |
-
-
-    Scenario: City address with suburb
-        When sending v1/reverse at 47.146861,9.511771 with format geocodejson
-        Then results contain
-          | housenumber | street   | district | city  | postcode | country |
-          | 5           | Lochgass | Ebenholz | Vaduz | 9490     | Liechtenstein |
-
-
-    @Tiger
-    Scenario: Tiger address
-        When sending v1/reverse at 32.4752389363,-86.4810198619 with format geocodejson
-        Then results contain
-         | osm_type | osm_id    | osm_key | osm_value | type  |
-         | way      | 396009653 | place   | house     | house |
-        And results contain
-         | housenumber | street              | city       | county         | postcode | country       |
-         | 707         | Upper Kingston Road | Prattville | Autauga County | 36067    | United States |
-
-
-    Scenario: Interpolation address
-        When sending v1/reverse at 47.118533,9.57056562 with format geocodejson
-        Then results contain
-          | osm_type | osm_id | osm_key | osm_value | type  |
-          | way      | 1      | place   | house     | house |
-        And results contain
-          | label |
-          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-        And result has not attributes name
-
-
-    Scenario: Line geometry output is supported
-        When sending v1/reverse at 47.06597,9.50467 with format geocodejson
-          | param           | value |
-          | polygon_geojson | 1     |
-        Then results contain in field geojson
-          | type       |
-          | LineString |
-
-
-    Scenario Outline: Only geojson polygons are supported
-        When sending v1/reverse at 47.06597,9.50467 with format geocodejson
-          | param   | value |
-          | <param> | 1     |
-        Then results contain in field geojson
-          | type  |
-          | Point |
-
-        Examples:
-          | param |
-          | polygon_text |
-          | polygon_svg  |
-          | polygon_kml  |
diff --git a/test/bdd/api/reverse/v1_geojson.feature b/test/bdd/api/reverse/v1_geojson.feature
deleted file mode 100644
index e705529d..00000000
--- a/test/bdd/api/reverse/v1_geojson.feature
+++ /dev/null
@@ -1,73 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Geojson for Reverse API
-    Testing correctness of geojson output (API version v1).
-
-    Scenario Outline: Simple OSM result
-        When sending v1/reverse at 47.066,9.504 with format geojson
-          | addressdetails |
-          | <has_address>  |
-        Then result has attributes place_id, importance, __licence
-        And result has <attributes> address
-        And results contain
-          | osm_type | osm_id     | place_rank | category | type    | addresstype |
-          | node     | 6522627624 | 30         | shop     | bakery  | shop        |
-        And results contain
-          | name                  | display_name |
-          | Dorfbäckerei Herrmann | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
-        And results contain
-          | boundingbox |
-          | [47.0660392, 47.0661392, 9.5035565, 9.5036565] |
-        And results contain in field geojson
-          | type  | coordinates |
-          | Point | [9.5036065, 47.0660892] |
-
-        Examples:
-          | has_address | attributes     |
-          | 1           | attributes     |
-          | 0           | not attributes |
-
-
-    @Tiger
-    Scenario: Tiger address
-        When sending v1/reverse at 32.4752389363,-86.4810198619 with format geojson
-        Then results contain
-         | osm_type | osm_id    | category | type  | addresstype  | place_rank |
-         | way      | 396009653 | place    | house | place        | 30         |
-
-
-    Scenario: Interpolation address
-        When sending v1/reverse at 47.118533,9.57056562 with format geojson
-        Then results contain
-          | osm_type | osm_id | place_rank | category | type    | addresstype |
-          | way      | 1      | 30         | place    | house   | place       |
-        And results contain
-          | boundingbox |
-          | ^\[47.118495\d*, 47.118595\d*, 9.570496\d*, 9.570596\d*\] |
-        And results contain
-          | display_name |
-          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-
-
-    Scenario: Line geometry output is supported
-        When sending v1/reverse at 47.06597,9.50467 with format geojson
-          | param           | value |
-          | polygon_geojson | 1     |
-        Then results contain in field geojson
-          | type       |
-          | LineString |
-
-
-    Scenario Outline: Only geojson polygons are supported
-        When sending v1/reverse at 47.06597,9.50467 with format geojson
-          | param   | value |
-          | <param> | 1     |
-        Then results contain in field geojson
-          | type  |
-          | Point |
-
-        Examples:
-          | param |
-          | polygon_text |
-          | polygon_svg  |
-          | polygon_kml  |
diff --git a/test/bdd/api/reverse/v1_json.feature b/test/bdd/api/reverse/v1_json.feature
deleted file mode 100644
index 1f629c0f..00000000
--- a/test/bdd/api/reverse/v1_json.feature
+++ /dev/null
@@ -1,130 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Json output for Reverse API
-    Testing correctness of json and jsonv2 output (API version v1).
-
-    Scenario Outline: OSM result with and without addresses
-        When sending v1/reverse at 47.066,9.504 with format json
-          | addressdetails |
-          | <has_address>  |
-        Then result has <attributes> address
-        When sending v1/reverse at 47.066,9.504 with format jsonv2
-          | addressdetails |
-          | <has_address>  |
-        Then result has <attributes> address
-
-        Examples:
-          | has_address | attributes     |
-          | 1           | attributes     |
-          | 0           | not attributes |
-
-    Scenario Outline: Simple OSM result
-        When sending v1/reverse at 47.066,9.504 with format <format>
-        Then result has attributes place_id
-        And results contain
-          | licence |
-          | ^Data © OpenStreetMap contributors, ODbL 1.0. https?://osm.org/copyright$ |
-        And results contain
-          | osm_type | osm_id     |
-          | node     | 6522627624 |
-        And results contain
-          | centroid             | boundingbox |
-          | 9.5036065 47.0660892 | ['47.0660392', '47.0661392', '9.5035565', '9.5036565'] |
-        And results contain
-          | display_name |
-          | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
-        And result has not attributes namedetails,extratags
-
-        Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-
-    Scenario: Extra attributes of jsonv2 result
-        When sending v1/reverse at 47.066,9.504 with format jsonv2
-        Then result has attributes importance
-        Then results contain
-          | category | type   | name                  | place_rank | addresstype |
-          | shop     | bakery | Dorfbäckerei Herrmann | 30         | shop        |
-
-
-    @Tiger
-    Scenario: Tiger address
-        When sending v1/reverse at 32.4752389363,-86.4810198619 with format jsonv2
-        Then results contain
-         | osm_type | osm_id    | category | type  | addresstype  |
-         | way      | 396009653 | place    | house | place        |
-
-
-    Scenario Outline: Interpolation address
-        When sending v1/reverse at 47.118533,9.57056562 with format <format>
-        Then results contain
-          | osm_type | osm_id |
-          | way      | 1      |
-        And results contain
-          | centroid                | boundingbox |
-          | 9.57054676 47.118545392 | ^\['47.118495\d*', '47.118595\d*', '9.570496\d*', '9.570596\d*'\] |
-        And results contain
-          | display_name |
-          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-
-        Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-
-
-    Scenario Outline: Output of geojson
-       When sending v1/reverse at 47.06597,9.50467 with format <format>
-          | param           | value |
-          | polygon_geojson | 1     |
-       Then results contain in field geojson
-          | type       | coordinates |
-          | LineString | [[9.5039353, 47.0657546], [9.5040437, 47.0657781], [9.5040808, 47.065787], [9.5054298, 47.0661407]] |
-
-       Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-
-
-    Scenario Outline: Output of WKT
-       When sending v1/reverse at 47.06597,9.50467 with format <format>
-          | param        | value |
-          | polygon_text | 1     |
-       Then results contain
-          | geotext |
-          | ^LINESTRING\(9.5039353 47.0657546, ?9.5040437 47.0657781, ?9.5040808 47.065787, ?9.5054298 47.0661407\) |
-
-       Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-
-
-    Scenario Outline: Output of SVG
-       When sending v1/reverse at 47.06597,9.50467 with format <format>
-          | param       | value |
-          | polygon_svg | 1     |
-       Then results contain
-          | svg |
-          | M 9.5039353 -47.0657546 L 9.5040437 -47.0657781 9.5040808 -47.065787 9.5054298 -47.0661407 |
-
-       Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-
-
-    Scenario Outline: Output of KML
-       When sending v1/reverse at 47.06597,9.50467 with format <format>
-          | param       | value |
-          | polygon_kml | 1     |
-       Then results contain
-          | geokml |
-          | ^<LineString><coordinates>9.5039\d*,47.0657\d* 9.5040\d*,47.0657\d* 9.5040\d*,47.065\d* 9.5054\d*,47.0661\d*</coordinates></LineString> |
-
-       Examples:
-          | format |
-          | json   |
-          | jsonv2 |
diff --git a/test/bdd/api/reverse/v1_params.feature b/test/bdd/api/reverse/v1_params.feature
deleted file mode 100644
index 09a190ed..00000000
--- a/test/bdd/api/reverse/v1_params.feature
+++ /dev/null
@@ -1,206 +0,0 @@
-@SQLITE
-@APIDB
-Feature: v1/reverse Parameter Tests
-    Tests for parameter inputs for the v1 reverse endpoint.
-    This file contains mostly bad parameter input. Valid parameters
-    are tested in the format tests.
-
-    Scenario: Bad format
-        When sending v1/reverse at 47.14122383,9.52169581334 with format sdf
-        Then a HTTP 400 is returned
-
-    Scenario: Missing lon parameter
-        When sending v1/reverse at 52.52,
-        Then a HTTP 400 is returned
-
-
-    Scenario: Missing lat parameter
-        When sending v1/reverse at ,52.52
-        Then a HTTP 400 is returned
-
-
-    Scenario Outline: Bad format for lat or lon
-        When sending v1/reverse at ,
-          | lat   | lon   |
-          | <lat> | <lon> |
-        Then a HTTP 400 is returned
-
-        Examples:
-          | lat      | lon |
-          | 48.9660  | 8,4482 |
-          | 48,9660  | 8.4482 |
-          | 48,9660  | 8,4482 |
-          | 48.966.0 | 8.4482 |
-          | 48.966   | 8.448.2 |
-          | Nan      | 8.448  |
-          | 48.966   | Nan    |
-          | Inf      | 5.6    |
-          | 5.6      | -Inf   |
-          | <script></script> | 3.4 |
-          | 3.4 | <script></script> |
-          | -45.3    | ;      |
-          | gkjd     | 50     |
-
-
-    Scenario: Non-numerical zoom levels return an error
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | zoom |
-          | adfe |
-        Then a HTTP 400 is returned
-
-
-    Scenario Outline: Truthy values for boolean parameters
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | addressdetails |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes address
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | extratags |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes extratags
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | namedetails |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes namedetails
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | polygon_geojson |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes geojson
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | polygon_kml |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes geokml
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | polygon_svg |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes svg
-
-        When sending v1/reverse at 47.14122383,9.52169581334
-          | polygon_text |
-          | <value> |
-        Then exactly 1 result is returned
-        And result has attributes geotext
-
-        Examples:
-          | value |
-          | yes   |
-          | no    |
-          | -1    |
-          | 100   |
-          | false |
-          | 00    |
-
-
-    Scenario: Only one geometry can be requested
-        When sending v1/reverse at 47.165989816710066,9.515774846076965
-          | polygon_text | polygon_svg |
-          | 1            | 1           |
-        Then a HTTP 400 is returned
-
-
-    Scenario Outline: Wrapping of legal jsonp requests
-        When sending v1/reverse at 67.3245,0.456 with format <format>
-          | json_callback |
-          | foo |
-        Then the result is valid <outformat>
-
-        Examples:
-          | format      | outformat   |
-          | json        | json        |
-          | jsonv2      | json        |
-          | geojson     | geojson     |
-          | geocodejson | geocodejson |
-
-
-    Scenario Outline: Illegal jsonp are not allowed
-        When sending v1/reverse at 47.165989816710066,9.515774846076965
-          | param        | value |
-          |json_callback | <data> |
-        Then a HTTP 400 is returned
-
-        Examples:
-          | data |
-          | 1asd |
-          | bar(foo) |
-          | XXX['bad'] |
-          | foo; evil |
-
-
-    Scenario Outline: Reverse debug mode produces valid HTML
-        When sending v1/reverse at , with format debug
-          | lat   | lon   |
-          | <lat> | <lon> |
-        Then the result is valid html
-
-        Examples:
-          | lat      | lon     |
-          | 0.0      | 0.0     |
-          | 47.06645 | 9.56601 |
-          | 47.14081 | 9.52267 |
-
-
-    Scenario Outline: Full address display for city housenumber-level address with street
-        When sending v1/reverse at 47.1068011,9.52810091 with format <format>
-        Then address of result 0 is
-          | type           | value     |
-          | house_number   | 8         |
-          | road           | Im Winkel |
-          | neighbourhood  | Oberdorf  |
-          | village        | Triesen   |
-          | ISO3166-2-lvl8 | LI-09     |
-          | county         | Oberland  |
-          | postcode       | 9495      |
-          | country        | Liechtenstein |
-          | country_code   | li        |
-
-        Examples:
-          | format  |
-          | json    |
-          | jsonv2  |
-          | geojson |
-          | xml     |
-
-
-    Scenario Outline: Results with name details
-        When sending v1/reverse at 47.14052,9.52202 with format <format>
-          | zoom | namedetails |
-          | 14   | 1           |
-        Then results contain in field namedetails
-          | name     |
-          | Ebenholz |
-
-        Examples:
-          | format  |
-          | json    |
-          | jsonv2  |
-          | xml     |
-          | geojson |
-
-
-    Scenario Outline: Results with extratags
-        When sending v1/reverse at 47.14052,9.52202 with format <format>
-          | zoom | extratags |
-          | 14   | 1         |
-        Then results contain in field extratags
-          | wikidata |
-          | Q4529531 |
-
-        Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-          | xml    |
-          | geojson |
-
-
diff --git a/test/bdd/api/reverse/v1_xml.feature b/test/bdd/api/reverse/v1_xml.feature
deleted file mode 100644
index 95e7478c..00000000
--- a/test/bdd/api/reverse/v1_xml.feature
+++ /dev/null
@@ -1,88 +0,0 @@
-@SQLITE
-@APIDB
-Feature: XML output for Reverse API
-    Testing correctness of xml output (API version v1).
-
-    Scenario Outline: OSM result with and without addresses
-        When sending v1/reverse at 47.066,9.504 with format xml
-          | addressdetails |
-          | <has_address>  |
-        Then result has attributes place_id
-        Then result has <attributes> address
-        And results contain
-          | osm_type | osm_id     | place_rank | address_rank |
-          | node     | 6522627624 | 30         | 30           |
-        And results contain
-          | centroid             | boundingbox |
-          | 9.5036065 47.0660892 | 47.0660392,47.0661392,9.5035565,9.5036565 |
-        And results contain
-          | ref                   | display_name |
-          | Dorfbäckerei Herrmann | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
-
-        Examples:
-          | has_address | attributes     |
-          | 1           | attributes     |
-          | 0           | not attributes |
-
-
-    @Tiger
-    Scenario: Tiger address
-        When sending v1/reverse at 32.4752389363,-86.4810198619 with format xml
-        Then results contain
-         | osm_type | osm_id    | place_rank  | address_rank |
-         | way      | 396009653 | 30          | 30           |
-        And results contain
-          | centroid                     | boundingbox |
-          | -86.4808553 32.4753580 | ^32.4753080\d*,32.4754080\d*,-86.4809053\d*,-86.4808053\d* |
-        And results contain
-          | display_name |
-          | 707, Upper Kingston Road, Upper Kingston, Prattville, Autauga County, 36067, United States |
-
-
-    Scenario: Interpolation address
-        When sending v1/reverse at 47.118533,9.57056562 with format xml
-        Then results contain
-          | osm_type | osm_id | place_rank | address_rank |
-          | way      | 1      | 30         | 30           |
-        And results contain
-          | centroid                | boundingbox |
-          | 9.57054676 47.118545392 | ^47.118495\d*,47.118595\d*,9.570496\d*,9.570596\d* |
-        And results contain
-          | display_name |
-          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
-
-
-    Scenario: Output of geojson
-       When sending v1/reverse at 47.06597,9.50467 with format xml
-          | param           | value |
-          | polygon_geojson | 1     |
-       Then results contain
-          | geojson |
-          | {"type":"LineString","coordinates":[[9.5039353,47.0657546],[9.5040437,47.0657781],[9.5040808,47.065787],[9.5054298,47.0661407]]}  |
-
-
-    Scenario: Output of WKT
-       When sending v1/reverse at 47.06597,9.50467 with format xml
-          | param        | value |
-          | polygon_text | 1     |
-       Then results contain
-          | geotext |
-          | ^LINESTRING\(9.5039353 47.0657546, ?9.5040437 47.0657781, ?9.5040808 47.065787, ?9.5054298 47.0661407\) |
-
-
-    Scenario: Output of SVG
-       When sending v1/reverse at 47.06597,9.50467 with format xml
-          | param       | value |
-          | polygon_svg | 1     |
-       Then results contain
-          | geosvg |
-          | M 9.5039353 -47.0657546 L 9.5040437 -47.0657781 9.5040808 -47.065787 9.5054298 -47.0661407 |
-
-
-    Scenario: Output of KML
-       When sending v1/reverse at 47.06597,9.50467 with format xml
-          | param       | value |
-          | polygon_kml | 1     |
-       Then results contain
-          | geokml |
-          | ^<geokml><LineString><coordinates>9.5039\d*,47.0657\d* 9.5040\d*,47.0657\d* 9.5040\d*,47.065\d* 9.5054\d*,47.0661\d*</coordinates></LineString></geokml> |
diff --git a/test/bdd/api/search/geocodejson.feature b/test/bdd/api/search/geocodejson.feature
deleted file mode 100644
index 271ec10c..00000000
--- a/test/bdd/api/search/geocodejson.feature
+++ /dev/null
@@ -1,28 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Parameters for Search API
-    Testing correctness of geocodejson output.
-
-    Scenario: City housenumber-level address with street
-        When sending geocodejson search query "Im Winkel 8, Triesen" with address
-        Then results contain
-          | housenumber | street    | postcode | city    | country |
-          | 8           | Im Winkel | 9495     | Triesen | Liechtenstein |
-
-    Scenario: Town street-level address with street
-        When sending geocodejson search query "Gnetsch, Balzers" with address
-        Then results contain
-          | name    | city    | postcode | country |
-          | Gnetsch | Balzers | 9496     | Liechtenstein |
-
-    Scenario: Town street-level address with footway
-        When sending geocodejson search query "burg gutenberg 6000 jahre geschichte" with address
-        Then results contain
-          | street  | city    | postcode | country |
-          | Burgweg | Balzers | 9496     | Liechtenstein |
-
-    Scenario: City address with suburb
-        When sending geocodejson search query "Lochgass 5, Ebenholz, Vaduz" with address
-        Then results contain
-          | housenumber | street   | district | city  | postcode | country |
-          | 5           | Lochgass | Ebenholz | Vaduz | 9490     | Liechtenstein |
diff --git a/test/bdd/api/search/language.feature b/test/bdd/api/search/language.feature
deleted file mode 100644
index fe14cdbe..00000000
--- a/test/bdd/api/search/language.feature
+++ /dev/null
@@ -1,63 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Localization of search results
-
-    Scenario: default language
-        When sending json search query "Liechtenstein"
-        Then results contain
-          | ID | display_name |
-          | 0  | Liechtenstein |
-
-    Scenario: accept-language first
-        When sending json search query "Liechtenstein"
-          | accept-language |
-          | zh,de |
-        Then results contain
-          | ID | display_name |
-          | 0  | 列支敦士登 |
-
-    Scenario: accept-language missing
-        When sending json search query "Liechtenstein"
-          | accept-language |
-          | xx,fr,en,de |
-        Then results contain
-          | ID | display_name |
-          | 0  | Liechtenstein |
-
-    Scenario: http accept language header first
-        Given the HTTP header
-          | accept-language |
-          | fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending json search query "Liechtenstein"
-        Then results contain
-          | ID | display_name |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header and accept-language
-        Given the HTTP header
-          | accept-language |
-          | fr-ca,fr;q=0.8,en-ca;q=0.5,en;q=0.3 |
-        When sending json search query "Liechtenstein"
-          | accept-language |
-          | fo,en |
-        Then results contain
-          | ID | display_name |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header fallback
-        Given the HTTP header
-          | accept-language |
-          | fo-ca,en-ca;q=0.5 |
-        When sending json search query "Liechtenstein"
-        Then results contain
-          | ID | display_name |
-          | 0  | Liktinstein |
-
-    Scenario: http accept language header fallback (upper case)
-        Given the HTTP header
-          | accept-language |
-          | fo-FR;q=0.8,en-ca;q=0.5 |
-        When sending json search query "Liechtenstein"
-        Then results contain
-          | ID | display_name |
-          | 0  | Liktinstein |
diff --git a/test/bdd/api/search/params.feature b/test/bdd/api/search/params.feature
deleted file mode 100644
index e77a00d2..00000000
--- a/test/bdd/api/search/params.feature
+++ /dev/null
@@ -1,362 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Search queries
-    Testing different queries and parameters
-
-    Scenario: Simple XML search
-        When sending xml search query "Schaan"
-        Then result 0 has attributes place_id,osm_type,osm_id
-        And result 0 has attributes place_rank,boundingbox
-        And result 0 has attributes lat,lon,display_name
-        And result 0 has attributes class,type,importance
-        And result 0 has not attributes address
-        And result 0 has bounding box in 46.5,47.5,9,10
-
-    Scenario: Simple JSON search
-        When sending json search query "Vaduz"
-        Then result 0 has attributes place_id,licence,class,type
-        And result 0 has attributes osm_type,osm_id,boundingbox
-        And result 0 has attributes lat,lon,display_name,importance
-        And result 0 has not attributes address
-        And result 0 has bounding box in 46.5,47.5,9,10
-
-    Scenario: Unknown formats returns a user error
-        When sending search query "Vaduz"
-          | format |
-          | x45    |
-        Then a HTTP 400 is returned
-
-    Scenario Outline: Search with addressdetails
-        When sending <format> search query "Triesen" with address
-        Then address of result 0 is
-          | type         | value |
-          | village      | Triesen |
-          | county       | Oberland |
-          | postcode     | 9495 |
-          | country      | Liechtenstein |
-          | country_code | li |
-          | ISO3166-2-lvl8 | LI-09 |
-
-    Examples:
-          | format |
-          | json   |
-          | jsonv2 |
-          | geojson |
-          | xml |
-
-    Scenario: Coordinate search with addressdetails
-        When sending json search query "47.12400621,9.6047552"
-          | accept-language |
-          | en |
-        Then results contain
-          | display_name |
-          | Guschg, Valorschstrasse, Balzers, Oberland, 9497, Liechtenstein |
-
-    Scenario: Address details with unknown class types
-        When sending json search query "Kloster St. Elisabeth" with address
-        Then results contain
-          | ID | class   | type |
-          | 0  | amenity | monastery |
-        And result addresses contain
-          | ID | amenity |
-          | 0  | Kloster St. Elisabeth |
-
-    Scenario: Disabling deduplication
-        When sending json search query "Malbunstr"
-        Then there are no duplicates
-        When sending json search query "Malbunstr"
-          | dedupe |
-          | 0 |
-        Then there are duplicates
-
-    Scenario: Search with bounded viewbox in right area
-        When sending json search query "post" with address
-          | bounded | viewbox |
-          | 1       |  9,47,10,48 |
-        Then result addresses contain
-          | ID | town |
-          | 0  | Vaduz |
-        When sending json search query "post" with address
-          | bounded | viewbox |
-          | 1       |  9.49712,47.17122,9.52605,47.16242 |
-        Then result addresses contain
-          | town |
-          | Schaan |
-
-    Scenario: Country search with bounded viewbox remain in the area
-        When sending json search query "" with address
-          | bounded | viewbox                                 | country |
-          | 1       | 9.49712,47.17122,9.52605,47.16242 | de |
-        Then less than 1 result is returned
-
-    Scenario: Search with bounded viewboxlbrt in right area
-        When sending json search query "bar" with address
-          | bounded | viewboxlbrt |
-          | 1       | 9.49712,47.16242,9.52605,47.17122 |
-        Then result addresses contain
-          | town |
-          | Schaan |
-
-    @Fail
-    Scenario: No POI search with unbounded viewbox
-        When sending json search query "restaurant"
-          | viewbox |
-          | 9.93027,53.61634,10.10073,53.54500 |
-        Then results contain
-          | display_name |
-          | ^[^,]*[Rr]estaurant.* |
-
-    Scenario: bounded search remains within viewbox, even with no results
-         When sending json search query "[restaurant]"
-           | bounded | viewbox |
-           | 1       | 43.5403125,-5.6563282,43.54285,-5.662003 |
-        Then less than 1 result is returned
-
-    Scenario: bounded search remains within viewbox with results
-        When sending json search query "restaurant"
-         | bounded | viewbox |
-         | 1       | 9.49712,47.17122,9.52605,47.16242 |
-        Then result has centroid in 9.49712,47.16242,9.52605,47.17122
-
-    Scenario: Prefer results within viewbox
-        When sending json search query "Gässle" with address
-          | accept-language | viewbox |
-          | en              | 9.52413,47.10759,9.53140,47.10539 |
-        Then result addresses contain
-          | ID | village |
-          | 0  | Triesen |
-        When sending json search query "Gässle" with address
-          | accept-language | viewbox |
-          | en              | 9.45949,47.08421,9.54094,47.05466 |
-        Then result addresses contain
-          | ID | town |
-          | 0  | Balzers |
-
-    Scenario: viewboxes cannot be points
-        When sending json search query "foo"
-          | viewbox |
-          | 1.01,34.6,1.01,34.6 |
-        Then a HTTP 400 is returned
-
-    Scenario Outline: viewbox must have four coordinate numbers
-        When sending json search query "foo"
-          | viewbox |
-          | <viewbox> |
-        Then a HTTP 400 is returned
-
-    Examples:
-        | viewbox |
-        | 34      |
-        | 0.003,-84.4 |
-        | 5.2,4.5542,12.4 |
-        | 23.1,-6,0.11,44.2,9.1 |
-
-    Scenario Outline: viewboxlbrt must have four coordinate numbers
-        When sending json search query "foo"
-          | viewboxlbrt |
-          | <viewbox> |
-        Then a HTTP 400 is returned
-
-    Examples:
-        | viewbox |
-        | 34      |
-        | 0.003,-84.4 |
-        | 5.2,4.5542,12.4 |
-        | 23.1,-6,0.11,44.2,9.1 |
-
-    Scenario: Overly large limit number for search results
-        When sending json search query "restaurant"
-          | limit |
-          | 1000 |
-        Then at most 50 results are returned
-
-    Scenario: Limit number of search results
-        When sending json search query "landstr"
-          | dedupe |
-          | 0      |
-        Then more than 4 results are returned
-        When sending json search query "landstr"
-          | limit | dedupe |
-          | 4     | 0      |
-        Then exactly 4 results are returned
-
-    Scenario: Limit parameter must be a number
-        When sending search query "Blue Laguna"
-          | limit |
-          | );    |
-        Then a HTTP 400 is returned
-
-    Scenario: Restrict to feature type country
-        When sending xml search query "fürstentum"
-          | featureType |
-          | country |
-        Then results contain
-          | place_rank |
-          | 4 |
-
-    Scenario: Restrict to feature type state
-        When sending xml search query "Wangerberg"
-        Then at least 1 result is returned
-        When sending xml search query "Wangerberg"
-          | featureType |
-          | state |
-        Then exactly 0 results are returned
-
-    Scenario: Restrict to feature type city
-        When sending xml search query "vaduz"
-        Then at least 1 result is returned
-        When sending xml search query "vaduz"
-          | featureType |
-          | city |
-        Then results contain
-          | place_rank |
-          | 16 |
-
-    Scenario: Restrict to feature type settlement
-        When sending json search query "Malbun"
-        Then results contain
-          | ID | class |
-          | 1  | landuse |
-        When sending json search query "Malbun"
-          | featureType |
-          | settlement |
-        Then results contain
-          | class | type |
-          | place | village |
-
-    Scenario Outline: Search with polygon threshold (json)
-        When sending json search query "triesenberg"
-          | polygon_geojson | polygon_threshold |
-          | 1               | <th> |
-        Then at least 1 result is returned
-        And result 0 has attributes geojson
-
-     Examples:
-        | th |
-        | -1 |
-        | 0.0 |
-        | 0.5 |
-        | 999 |
-
-    Scenario Outline: Search with polygon threshold (xml)
-        When sending xml search query "triesenberg"
-          | polygon_geojson | polygon_threshold |
-          | 1               | <th> |
-        Then at least 1 result is returned
-        And result 0 has attributes geojson
-
-     Examples:
-        | th |
-        | -1 |
-        | 0.0 |
-        | 0.5 |
-        | 999 |
-
-    Scenario Outline: Search with invalid polygon threshold (xml)
-        When sending xml search query "triesenberg"
-          | polygon_geojson | polygon_threshold |
-          | 1               | <th> |
-        Then a HTTP 400 is returned
-
-     Examples:
-        | th |
-        | x |
-        | ;; |
-        | 1m |
-
-    Scenario Outline: Search with extratags
-        When sending <format> search query "Landstr"
-          | extratags |
-          | 1 |
-        Then result has attributes extratags
-
-    Examples:
-        | format |
-        | xml |
-        | json |
-        | jsonv2 |
-        | geojson |
-
-    Scenario Outline: Search with namedetails
-        When sending <format> search query "Landstr"
-          | namedetails |
-          | 1 |
-        Then result has attributes namedetails
-
-    Examples:
-        | format |
-        | xml |
-        | json |
-        | jsonv2 |
-        | geojson |
-
-    Scenario Outline: Search result with contains TEXT geometry
-        When sending <format> search query "triesenberg"
-          | polygon_text |
-          | 1 |
-        Then result has attributes <response_attribute>
-
-    Examples:
-        | format   | response_attribute |
-        | xml      | geotext |
-        | json     | geotext |
-        | jsonv2   | geotext |
-
-    Scenario Outline: Search result contains SVG geometry
-        When sending <format> search query "triesenberg"
-          | polygon_svg |
-          | 1 |
-        Then result has attributes <response_attribute>
-
-    Examples:
-        | format   | response_attribute |
-        | xml      | geosvg |
-        | json     | svg |
-        | jsonv2   | svg |
-
-    Scenario Outline: Search result contains KML geometry
-        When sending <format> search query "triesenberg"
-          | polygon_kml |
-          | 1 |
-        Then result has attributes <response_attribute>
-
-    Examples:
-        | format   | response_attribute |
-        | xml      | geokml |
-        | json     | geokml |
-        | jsonv2   | geokml |
-
-    Scenario Outline: Search result contains GEOJSON geometry
-        When sending <format> search query "triesenberg"
-          | polygon_geojson |
-          | 1 |
-        Then result has attributes <response_attribute>
-
-    Examples:
-        | format   | response_attribute |
-        | xml      | geojson |
-        | json     | geojson |
-        | jsonv2   | geojson |
-        | geojson  | geojson |
-
-    Scenario Outline: Search result in geojson format contains no non-geojson geometry
-        When sending geojson search query "triesenberg"
-          | polygon_text | polygon_svg | polygon_geokml |
-          | 1            | 1           | 1              |
-        Then result 0 has not attributes <response_attribute>
-
-    Examples:
-        | response_attribute |
-        | geotext            |
-        | polygonpoints      |
-        | svg                |
-        | geokml             |
-
-
-    Scenario: Array parameters are ignored
-        When sending json search query "Vaduz" with address
-          | countrycodes[] | polygon_svg[] | limit[] | polygon_threshold[] |
-          | IT             | 1             | 3       | 3.4                 |
-        Then result addresses contain
-          | ID | country_code |
-          | 0  | li           |
diff --git a/test/bdd/api/search/queries.feature b/test/bdd/api/search/queries.feature
deleted file mode 100644
index 6e640acc..00000000
--- a/test/bdd/api/search/queries.feature
+++ /dev/null
@@ -1,221 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Search queries
-    Generic search result correctness
-
-    Scenario: Search for natural object
-        When sending json search query "Samina"
-          | accept-language |
-          | en |
-        Then results contain
-          | ID | class    | type  | display_name    |
-          | 0  | waterway | river | Samina, Austria |
-
-    Scenario: House number search for non-street address
-        When sending json search query "6 Silum, Liechtenstein" with address
-          | accept-language |
-          | en |
-        Then address of result 0 is
-          | type         | value |
-          | house_number | 6 |
-          | village      | Silum |
-          | town         | Triesenberg |
-          | county       | Oberland |
-          | postcode     | 9497 |
-          | country      | Liechtenstein |
-          | country_code | li |
-          | ISO3166-2-lvl8  | LI-10 |
-
-    Scenario: House number interpolation
-        When sending json search query "Grosssteg 1023, Triesenberg" with address
-          | accept-language |
-          | de |
-        Then address of result 0 contains
-          | type          | value |
-          | house_number  | 1023 |
-          | road          | Grosssteg |
-          | village       | Sücka |
-          | postcode      | 9497 |
-          | town          | Triesenberg |
-          | country       | Liechtenstein |
-          | country_code  | li |
-
-    Scenario: With missing housenumber search falls back to road
-        When sending json search query "Bündaweg 555" with address
-        Then address of result 0 is
-          | type          | value |
-          | road          | Bündaweg |
-          | village       | Silum |
-          | postcode      | 9497 |
-          | county        | Oberland |
-          | town          | Triesenberg |
-          | country       | Liechtenstein |
-          | country_code  | li |
-          | ISO3166-2-lvl8  | LI-10 |
-
-    Scenario Outline: Housenumber 0 can be found
-        When sending <format> search query "Gnalpstrasse 0" with address
-        Then results contain
-          | display_name |
-          | ^0,.* |
-        And result addresses contain
-          | house_number |
-          | 0     |
-
-    Examples:
-        | format |
-        | xml |
-        | json |
-        | jsonv2 |
-        | geojson |
-
-    @Tiger
-    Scenario: TIGER house number
-        When sending json search query "697 Upper Kingston Road"
-        Then results contain
-         | osm_type | display_name |
-         | way      | ^697,.* |
-
-    Scenario: Search with class-type feature
-        When sending jsonv2 search query "bars in ebenholz"
-        Then results contain
-          | place_rank |
-          | 30 |
-
-    Scenario: Search with specific amenity
-        When sending json search query "[restaurant] Vaduz" with address
-        Then result addresses contain
-          | country |
-          | Liechtenstein |
-        And  results contain
-          | class   | type |
-          | amenity | restaurant |
-
-    Scenario: Search with specific amenity also work in country
-        When sending json search query "restaurants in liechtenstein" with address
-        Then result addresses contain
-          | country |
-          | Liechtenstein |
-        And  results contain
-          | class   | type |
-          | amenity | restaurant |
-
-    Scenario: Search with key-value amenity
-        When sending json search query "[club=scout] Vaduz"
-        Then results contain
-          | class | type |
-          | club  | scout |
-
-    Scenario: POI search near given coordinate
-        When sending json search query "restaurant near 47.16712,9.51100"
-        Then results contain
-          | class   | type |
-          | amenity | restaurant |
-
-    Scenario: Arbitrary key/value search near given coordinate
-        When sending json search query "[leisure=firepit]   47.150° N 9.5340493° E"
-        Then results contain
-          | class   | type |
-          | leisure | firepit |
-
-
-    Scenario: POI search in a bounded viewbox
-        When sending json search query "restaurants"
-          | viewbox                           | bounded |
-          | 9.50830,47.15253,9.52043,47.14866 | 1 |
-        Then results contain
-          | class   | type       |
-          | amenity | restaurant |
-
-    Scenario Outline: Key/value search near given coordinate can be restricted to country
-        When sending json search query "[natural=peak] 47.06512,9.53965" with address
-          | countrycodes |
-          | <cc> |
-        Then result addresses contain
-          | country_code |
-          | <cc> |
-
-    Examples:
-        | cc |
-        | li |
-        | ch |
-
-    Scenario: Name search near given coordinate
-        When sending json search query "sporry" with address
-        Then result addresses contain
-          | ID | town |
-          | 0  | Vaduz |
-        When sending json search query "sporry, 47.10791,9.52676" with address
-        Then result addresses contain
-          | ID | village |
-          | 0  | Triesen |
-
-    Scenario: Name search near given coordinate without result
-        When sending json search query "sporry, N 47 15 7 W 9 61 26"
-        Then exactly 0 results are returned
-
-    Scenario: Arbitrary key/value search near a road
-        When sending json search query "[amenity=drinking_water] Wissfläckaweg"
-        Then results contain
-          | class   | type |
-          | amenity | drinking_water |
-
-    Scenario: Ignore other country codes in structured search with country
-        When sending json search query ""
-            | city | country |
-            | li   | de      |
-        Then exactly 0 results are returned
-
-    Scenario: Ignore country searches when query is restricted to countries
-        When sending json search query "fr"
-            | countrycodes |
-            | li  |
-        Then exactly 0 results are returned
-
-    Scenario: Country searches only return results for the given country
-        When sending search query "Ans Trail" with address
-            | countrycodes |
-            | li |
-        Then result addresses contain
-            | country_code |
-            | li |
-
-    # https://trac.openstreetmap.org/ticket/5094
-    Scenario: housenumbers are ordered by complete match first
-        When sending json search query "Austrasse 11, Vaduz" with address
-        Then result addresses contain
-          | ID | house_number |
-          | 0  | 11 |
-
-    Scenario Outline: Coordinate searches with white spaces
-        When sending json search query "<data>"
-        Then exactly 1 result is returned
-        And results contain
-          | class   |
-          | natural |
-
-    Examples:
-      | data |
-      | sporry weiher, N 47.10791° E 9.52676° |
-      | sporry weiher,	N 47.10791° E 9.52676° |
-      | 	sporry weiher	, 	N 47.10791° E 9.52676° |
-      | sporry weiher, N 47.10791° 		E 9.52676° |
-      | sporry weiher, N 47.10791° E	9.52676° |
-
-    Scenario: Searches with white spaces
-        When sending json search query "52	Bodastr,Triesenberg"
-        Then results contain
-          | class   | type |
-          | highway | residential |
-
-
-    # github #1949
-    Scenario: Addressdetails always return the place type
-       When sending json search query "Vaduz" with address
-       Then result addresses contain
-         | ID | town |
-         | 0  | Vaduz |
-
-    Scenario: Search can handle complex query word sets
-       When sending search query "aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus"
-       Then a HTTP 200 is returned
diff --git a/test/bdd/api/search/simple.feature b/test/bdd/api/search/simple.feature
deleted file mode 100644
index 655c639b..00000000
--- a/test/bdd/api/search/simple.feature
+++ /dev/null
@@ -1,208 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Simple Tests
-    Simple tests for internal server errors and response format.
-
-    Scenario Outline: Testing different parameters
-        When sending search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-        When sending xml search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-        When sending json search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-        When sending jsonv2 search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-        When sending geojson search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-        When sending geocodejson search query "Vaduz"
-          | param       | value   |
-          | <parameter> | <value> |
-        Then at least 1 result is returned
-
-    Examples:
-     | parameter        | value |
-     | addressdetails   | 0 |
-     | polygon_text     | 0 |
-     | polygon_kml      | 0 |
-     | polygon_geojson  | 0 |
-     | polygon_svg      | 0 |
-     | accept-language  | de,en |
-     | countrycodes     | li |
-     | bounded          | 1 |
-     | bounded          | 0 |
-     | exclude_place_ids| 385252,1234515 |
-     | limit            | 1000 |
-     | dedupe           | 1 |
-     | dedupe           | 0 |
-     | extratags        | 0 |
-     | namedetails      | 0 |
-
-    Scenario: Search with invalid output format
-        When sending search query "Berlin"
-          | format |
-          | fd$# |
-        Then a HTTP 400 is returned
-
-    Scenario Outline: Simple Searches
-        When sending search query "<query>"
-        Then the result is valid json
-        When sending xml search query "<query>"
-        Then the result is valid xml
-        When sending json search query "<query>"
-        Then the result is valid json
-        When sending jsonv2 search query "<query>"
-        Then the result is valid json
-        When sending geojson search query "<query>"
-        Then the result is valid geojson
-
-    Examples:
-     | query |
-     | New York, New York |
-     | France |
-     | 12, Main Street, Houston |
-     | München |
-     | 東京都 |
-     | hotels in nantes |
-     | xywxkrf |
-     | gh; foo() |
-     | %#$@*&l;der#$! |
-     | 234 |
-     | 47.4,8.3 |
-
-    Scenario: Empty XML search
-        When sending xml search query "xnznxvcx"
-        Then result header contains
-          | attr        | value |
-          | querystring | xnznxvcx |
-          | more_url    | .*q=xnznxvcx.*format=xml |
-
-    Scenario: Empty XML search with special XML characters
-        When sending xml search query "xfdghn&zxn"xvbyx<vxx>cssdex"
-        Then result header contains
-          | attr        | value |
-          | querystring | xfdghn&zxn"xvbyx<vxx>cssdex |
-          | more_url    | .*q=xfdghn%26zxn%22xvbyx%3Cvxx%3Ecssdex.*format=xml |
-
-    Scenario: Empty XML search with viewbox
-        When sending xml search query "xnznxvcx"
-          | viewbox |
-          | 12,33,77,45.13 |
-        Then result header contains
-          | attr        | value |
-          | querystring | xnznxvcx |
-          | viewbox     | 12,33,77,45.13 |
-
-    Scenario: Empty XML search with viewboxlbrt
-        When sending xml search query "xnznxvcx"
-          | viewboxlbrt |
-          | 12,34.13,77,45 |
-        Then result header contains
-          | attr        | value |
-          | querystring | xnznxvcx |
-          | viewbox     | 12,34.13,77,45 |
-
-    Scenario: Empty XML search with viewboxlbrt and viewbox
-        When sending xml search query "pub"
-          | viewbox        | viewboxblrt |
-          | 12,33,77,45.13 | 1,2,3,4 |
-        Then result header contains
-          | attr        | value |
-          | querystring | pub |
-          | viewbox     | 12,33,77,45.13 |
-
-    Scenario: Empty XML search with excluded place ids
-        When sending xml search query "jghrleoxsbwjer"
-          | exclude_place_ids |
-          | 123,76,342565 |
-        Then result header contains
-          | attr              | value |
-          | exclude_place_ids | 123,76,342565 |
-
-    Scenario: Empty XML search with bad excluded place ids
-        When sending xml search query "jghrleoxsbwjer"
-          | exclude_place_ids |
-          | , |
-        Then result header has not attributes exclude_place_ids
-
-    Scenario Outline: Wrapping of legal jsonp search requests
-        When sending json search query "Tokyo"
-            | param        | value |
-            |json_callback | <data> |
-        Then result header contains
-            | attr         | value |
-            | json_func    | <result> |
-
-    Examples:
-     | data    | result |
-     | foo     | foo |
-     | FOO     | FOO |
-     | __world | __world |
-
-    Scenario Outline: Wrapping of illegal jsonp search requests
-        When sending json search query "Tokyo"
-            | param        | value |
-            |json_callback | <data> |
-        Then a json user error is returned
-
-    Examples:
-      | data |
-      | 1asd |
-      | bar(foo) |
-      | XXX['bad'] |
-      | foo; evil |
-
-    Scenario: Ignore jsonp parameter for anything but json
-        When sending json search query "Malibu"
-          | json_callback |
-          | 234 |
-        Then a HTTP 400 is returned
-        When sending xml search query "Malibu"
-          | json_callback |
-          | 234 |
-        Then the result is valid xml
-
-    Scenario Outline: Empty search
-        When sending <format> search query "YHlERzzx"
-        Then exactly 0 results are returned
-
-    Examples:
-        | format |
-        | json |
-        | jsonv2 |
-        | geojson |
-        | geocodejson |
-
-    Scenario: Search for non-existing coordinates
-        When sending json search query "-21.0,-33.0"
-        Then exactly 0 results are returned
-
-    Scenario: Country code selection is retained in more URL (#596)
-        When sending xml search query "Vaduz"
-          | countrycodes |
-          | pl,1,,invalid,undefined,%3Cb%3E,bo,, |
-        Then result header contains
-          | attr     | value |
-          | more_url | .*&countrycodes=pl%2Cbo&.* |
-
-    Scenario Outline: Search debug output does not return errors
-        When sending debug search query "<query>"
-        Then a HTTP 200 is returned
-
-    Examples:
-        | query |
-        | Liechtenstein |
-        | Triesen |
-        | Pfarrkirche |
-        | Landstr 27 Steinort, Triesenberg, 9495 |
-        | 9497 |
-        | restaurant in triesen |
diff --git a/test/bdd/api/search/structured.feature b/test/bdd/api/search/structured.feature
deleted file mode 100644
index a1dd5b83..00000000
--- a/test/bdd/api/search/structured.feature
+++ /dev/null
@@ -1,69 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Structured search queries
-    Testing correctness of results with
-    structured queries
-
-    Scenario: Country only
-        When sending json search query "" with address
-          | country |
-          | Liechtenstein |
-        Then address of result 0 is
-          | type         | value |
-          | country      | Liechtenstein |
-          | country_code | li |
-
-    Scenario: Postcode only
-        When sending json search query "" with address
-          | postalcode |
-          | 9495 |
-        Then results contain
-          | type |
-          | ^post(al_)?code |
-        And result addresses contain
-          | postcode |
-          | 9495 |
-
-    Scenario: Street, postcode and country
-        When sending xml search query "" with address
-          | street          | postalcode | country |
-          | Old Palace Road | GU2 7UP    | United Kingdom |
-        Then result header contains
-          | attr        | value |
-          | querystring | Old Palace Road, GU2 7UP, United Kingdom |
-
-    Scenario: Street with housenumber, city and postcode
-        When sending xml search query "" with address
-          | street             | city  | postalcode |
-          | 19 Am schrägen Weg | Vaduz | 9490       |
-        Then result addresses contain
-          | house_number | road |
-          | 19           | Am Schrägen Weg |
-
-    Scenario: Street with housenumber, city and bad postcode
-        When sending xml search query "" with address
-          | street             | city  | postalcode |
-          | 19 Am schrägen Weg | Vaduz | 9491       |
-        Then result addresses contain
-          | house_number | road |
-          | 19           | Am Schrägen Weg |
-
-    Scenario: Amenity, city
-        When sending json search query "" with address
-          | city  | amenity |
-          | Vaduz | bar  |
-        Then result addresses contain
-          | country |
-          | Liechtenstein |
-        And  results contain
-          | class   | type |
-          | amenity | ^(pub)\|(bar)\|(restaurant) |
-
-    #176
-    Scenario: Structured search restricts rank
-        When sending json search query "" with address
-          | city |
-          | Vaduz |
-        Then result addresses contain
-          | town |
-          | Vaduz |
diff --git a/test/bdd/api/status/failures.feature b/test/bdd/api/status/failures.feature
deleted file mode 100644
index 70e9589a..00000000
--- a/test/bdd/api/status/failures.feature
+++ /dev/null
@@ -1,17 +0,0 @@
-@UNKNOWNDB
-Feature: Status queries against unknown database
-    Testing status query
-
-    Scenario: Failed status as text
-        When sending text status query
-        Then a HTTP 500 is returned
-        And the page contents equals "ERROR: Database connection failed"
-
-    Scenario: Failed status as json
-        When sending json status query
-        Then a HTTP 200 is returned
-        And the result is valid json
-        And results contain
-          | status | message |
-          | 700    | Database connection failed |
-        And result has not attributes data_updated
diff --git a/test/bdd/api/status/simple.feature b/test/bdd/api/status/simple.feature
deleted file mode 100644
index 993fa1ec..00000000
--- a/test/bdd/api/status/simple.feature
+++ /dev/null
@@ -1,17 +0,0 @@
-@SQLITE
-@APIDB
-Feature: Status queries
-    Testing status query
-
-    Scenario: Status as text
-        When sending status query
-        Then a HTTP 200 is returned
-        And the page contents equals "OK"
-
-    Scenario: Status as json
-        When sending json status query
-        Then the result is valid json
-        And results contain
-          | status | message |
-          | 0      | OK      |
-        And result has attributes data_updated
diff --git a/test/bdd/conftest.py b/test/bdd/conftest.py
new file mode 100644
index 00000000..6d2b0b69
--- /dev/null
+++ b/test/bdd/conftest.py
@@ -0,0 +1,358 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Fixtures for BDD test steps
+"""
+import sys
+import json
+from pathlib import Path
+
+import psycopg
+from psycopg import sql as pysql
+
+# always test against the source
+SRC_DIR = (Path(__file__) / '..' / '..' / '..').resolve()
+sys.path.insert(0, str(SRC_DIR / 'src'))
+
+import pytest
+from pytest_bdd.parsers import re as step_parse
+from pytest_bdd import given, when, then
+
+pytest.register_assert_rewrite('utils')
+
+from utils.api_runner import APIRunner
+from utils.api_result import APIResult
+from utils.checks import ResultAttr, COMPARATOR_TERMS
+from utils.geometry_alias import ALIASES
+from utils.grid import Grid
+from utils.db import DBManager
+
+from nominatim_db.config import Configuration
+from nominatim_db.data.country_info import setup_country_config
+
+
+def _strlist(inp):  # converter: comma-separated text -> list of whitespace-stripped items
+    return [item.strip() for item in inp.split(',')]
+
+
+def _pretty_json(inp):  # serialise to JSON text with 2-space indentation (for messages)
+    return json.dumps(inp, indent=2)
+
+
+def pytest_addoption(parser, pluginmanager):
+    """ Register Nominatim's command line options and ini settings with pytest. """
+    parser.addoption('--nominatim-purge', dest='NOMINATIM_PURGE', action='store_true',
+                     help='Force recreation of test databases from scratch.')
+    parser.addoption('--nominatim-keep-db', dest='NOMINATIM_KEEP_DB', action='store_true',
+                     help='Do not drop the database after tests are finished.')
+    parser.addoption('--nominatim-api-engine', dest='NOMINATIM_API_ENGINE', default='falcon',
+                     help='Choose the API engine to use when sending requests.')
+    parser.addoption('--nominatim-tokenizer', dest='NOMINATIM_TOKENIZER',
+                     metavar='TOKENIZER',
+                     help='Use the specified tokenizer for importing data into '
+                          'a Nominatim database.')
+
+    parser.addini('nominatim_test_db', default='test_nominatim',
+                  help='Name of the database used for running a single test.')
+    parser.addini('nominatim_api_test_db', default='test_api_nominatim',
+                  help='Name of the database for storing API test data.')
+    parser.addini('nominatim_template_db', default='test_template_nominatim',
+                  help='Name of database used as a template for test databases.')
+
+
+@pytest.fixture
+def datatable():
+    """ Fallback fixture returning None, so steps may request a datatable that is absent.
+    """
+    return None
+
+
+@pytest.fixture
+def node_grid():
+    """ Default node grid: a Grid over a single empty row, without step or origin.
+    """
+    return Grid([[]], None, None)
+
+
+@pytest.fixture(scope='session', autouse=True)
+def setup_country_info():  # autouse + session scope: set up once per test session
+    setup_country_config(Configuration(None))
+
+
+@pytest.fixture(scope='session')
+def template_db(pytestconfig):
+    """ Make sure the template database exists and return its name.
+        It contains the extensions and base data Nominatim needs, so
+        that test databases can be copied from it instead of running
+        the full setup each time.
+
+        The template is only built when it is missing or a purge was requested.
+    """
+    manager = DBManager(purge=pytestconfig.option.NOMINATIM_PURGE)
+
+    name = pytestconfig.getini('nominatim_template_db')
+
+    dsn_env = {'NOMINATIM_DATABASE_DSN': f"pgsql:dbname={name}"}
+    config = Configuration(None, environ=dsn_env)
+
+    manager.setup_template_db(config)
+
+    return name
+
+
+@pytest.fixture
+def def_config(pytestconfig):
+    """ Configuration whose DSN points at the per-test database (ini 'nominatim_test_db').
+    """
+    dsn = f"pgsql:dbname={pytestconfig.getini('nominatim_test_db')}"
+    return Configuration(None, environ={'NOMINATIM_DATABASE_DSN': dsn})
+
+
+@pytest.fixture
+def db(template_db, pytestconfig):
+    """ Create the test database from the template and yield its name.
+        It is dropped after the test unless --nominatim-keep-db was given.
+    """
+    options = pytestconfig.option
+    manager = DBManager(purge=options.NOMINATIM_PURGE)
+    name = pytestconfig.getini('nominatim_test_db')
+    manager.create_db_from_template(name, template_db)
+
+    yield name
+
+    if not options.NOMINATIM_KEEP_DB:
+        manager.drop_db(name)
+
+
+@pytest.fixture
+def db_conn(db, def_config):  # requesting `db` makes sure the database is set up first
+    with psycopg.connect(def_config.get_libpq_dsn()) as conn:
+        info = psycopg.types.TypeInfo.fetch(conn, "hstore")  # look up the hstore type
+        psycopg.types.hstore.register_hstore(info, conn)  # register it for this connection
+        yield conn  # the `with` block is left once the test is done with the connection
+
+
+@when(step_parse(r'reverse geocoding (?P<lat>[\d.-]*),(?P<lon>[\d.-]*)'),
+      target_fixture='nominatim_result')
+def reverse_geocode_via_api(test_config_env, pytestconfig, datatable, lat, lon):
+    """ Run a jsonv2 reverse lookup and return the single result plus a WKT 'centroid'.
+    """
+    runner = APIRunner(test_config_env, pytestconfig.option.NOMINATIM_API_ENGINE)
+    coordinate = {'lat': float(lat), 'lon': float(lon)}
+    response = runner.run_step('reverse', coordinate, datatable, 'jsonv2', {})
+    assert response.status == 200
+    assert response.headers['content-type'] == 'application/json; charset=utf-8'
+
+    parsed = APIResult('json', 'reverse', response.body)
+    assert parsed.is_simple()
+    place = parsed.result
+    assert isinstance(place['lat'], str)
+    assert isinstance(place['lon'], str)
+    place['centroid'] = f"POINT({place['lon']} {place['lat']})"
+
+    return parsed
+
+
+@when(step_parse(r'reverse geocoding at node (?P<node>[\d]+)'),
+      target_fixture='nominatim_result')
+def reverse_geocode_via_api_and_grid(test_config_env, pytestconfig, node_grid, datatable, node):
+    """ Reverse geocode at a grid node; index 1 of its position is used as lat, 0 as lon. """
+    point = node_grid.get(node)
+    if point is None:
+        raise ValueError('Unknown node id')
+    return reverse_geocode_via_api(test_config_env, pytestconfig, datatable, point[1], point[0])
+
+
+@when(step_parse(r'geocoding(?: "(?P<query>.*)")?'),
+      target_fixture='nominatim_result')
+def forward_geocode_via_api(test_config_env, pytestconfig, datatable, query):
+    """ Run a jsonv2 search with address details, optionally with a free-text
+        query, and return the results with a WKT 'centroid' added to each.
+    """
+    runner = APIRunner(test_config_env, pytestconfig.option.NOMINATIM_API_ENGINE)
+
+    params = {'addressdetails': '1', 'q': query} if query else {'addressdetails': '1'}
+    response = runner.run_step('search', params, datatable, 'jsonv2', {})
+
+    assert response.status == 200
+    assert response.headers['content-type'] == 'application/json; charset=utf-8'
+
+    parsed = APIResult('json', 'search', response.body)
+    assert not parsed.is_simple()
+
+    for place in parsed.result:
+        assert isinstance(place['lat'], str)
+        assert isinstance(place['lon'], str)
+        place['centroid'] = f"POINT({place['lon']} {place['lat']})"
+
+    return parsed
+
+
+@then(step_parse(r'(?P<op>[a-z ]+) (?P<num>\d+) results? (?:are|is) returned'),
+      converters={'num': int})
+def check_number_of_results(nominatim_result, op, num):  # `op` selects the comparator by name
+    assert not nominatim_result.is_simple()  # only meaningful for result lists
+    assert COMPARATOR_TERMS[op](num, len(nominatim_result))  # expected count first, actual second
+
+
+@then(step_parse('the result metadata contains'))
+def check_metadata_for_fields(nominatim_result, datatable):
+    """ Compare metadata fields with the table, which is given either as
+        'param'/'value' rows or as a row of field names plus one row of values.
+    """
+    vertical = datatable[0] == ['param', 'value']
+    expected = datatable[1:] if vertical else zip(datatable[0], datatable[1])
+    for field, value in expected:
+        assert ResultAttr(nominatim_result.meta, field) == value
+
+
+@then(step_parse('the result metadata has no attributes (?P<attributes>.*)'),
+      converters={'attributes': _strlist})
+def check_metadata_for_field_presence(nominatim_result, attributes):  # asserts absence
+    meta = nominatim_result.meta
+    assert not any(name in meta for name in attributes), \
+        f"Unexpectedly have one of the attributes '{attributes}' in\n{_pretty_json(meta)}"
+
+
+@then(step_parse(r'the result contains(?: in field (?P<field>\S+))?'))
+def check_result_for_fields(nominatim_result, datatable, node_grid, field):
+    """ Check fields of a single result against the table ('param'/'value' rows or
+        names plus one value row). With 'in field X', names are prefixed by 'X+'.
+    """
+    assert nominatim_result.is_simple()
+
+    vertical = datatable[0] == ['param', 'value']
+    expected = datatable[1:] if vertical else zip(datatable[0], datatable[1])
+    prefix = f"{field}+" if field else ''
+
+    for name, value in expected:
+        assert ResultAttr(nominatim_result.result, prefix + name, grid=node_grid) == value
+
+
+@then(step_parse('the result has attributes (?P<attributes>.*)'),
+      converters={'attributes': _strlist})
+def check_result_for_field_presence(nominatim_result, attributes):  # single result only
+    assert nominatim_result.is_simple()
+    assert not [name for name in attributes if name not in nominatim_result.result]
+
+
+@then(step_parse('the result has no attributes (?P<attributes>.*)'),
+      converters={'attributes': _strlist})
+def check_result_for_field_absence(nominatim_result, attributes):  # single result only
+    assert nominatim_result.is_simple()
+    assert not [name for name in attributes if name in nominatim_result.result]
+
+
+@then(step_parse('the result set contains(?P<exact> exactly)?'))
+def check_result_list_match(nominatim_result, datatable, exact):
+    assert not nominatim_result.is_simple()
+
+    result_set = set(range(len(nominatim_result.result)))  # indexes of still unmatched results
+
+    for row in datatable[1:]:  # datatable[0] holds the field names
+        for idx in result_set:
+            for key, value in zip(datatable[0], row):
+                if ResultAttr(nominatim_result.result[idx], key) != value:
+                    break  # mismatch, try the next candidate result
+            else:
+                # all fields matched: consume this result so it cannot match another row
+                result_set.remove(idx)
+                break  # leaving the loop right away makes removing during iteration safe
+        else:
+            assert False, f"Missing data row {row}. Full response:\n{nominatim_result}"
+
+    if exact:
+        assert not [nominatim_result.result[i] for i in result_set]  # no unmatched results left
+
+
+@then(step_parse('all results have attributes (?P<attributes>.*)'),
+      converters={'attributes': _strlist})
+def check_all_results_for_field_presence(nominatim_result, attributes):  # empty lists fail
+    assert not nominatim_result.is_simple()
+    assert len(nominatim_result) > 0
+    for entry in nominatim_result.result:
+        assert not any(name not in entry for name in attributes), \
+            f"Missing one of the attributes '{attributes}' in\n{_pretty_json(entry)}"
+
+
+@then(step_parse('all results have no attributes (?P<attributes>.*)'),
+      converters={'attributes': _strlist})
+def check_all_result_for_field_absence(nominatim_result, attributes):  # empty lists fail
+    assert not nominatim_result.is_simple()
+    assert len(nominatim_result) > 0
+    for entry in nominatim_result.result:
+        assert not any(name in entry for name in attributes), \
+            f"Unexpectedly have one of the attributes '{attributes}' in\n{_pretty_json(entry)}"
+
+
+@then(step_parse(r'all results contain(?: in field (?P<field>\S+))?'))
+def check_all_results_contain(nominatim_result, datatable, node_grid, field):
+    """ Check that every result matches the table ('param'/'value' rows or names
+        plus one value row). With 'in field X', names are prefixed by 'X+'.
+    """
+    assert not nominatim_result.is_simple()
+    assert len(nominatim_result) > 0
+
+    vertical = datatable[0] == ['param', 'value']
+    expected = datatable[1:] if vertical else zip(datatable[0], datatable[1])
+    prefix = f"{field}+" if field else ''
+
+    for name, value in expected:
+        for entry in nominatim_result.result:
+            assert ResultAttr(entry, prefix + name, grid=node_grid) == value
+
+
+@then(step_parse(r'result (?P<num>\d+) contains(?: in field (?P<field>\S+))?'),
+      converters={'num': int})
+def check_specific_result_for_fields(nominatim_result, datatable, num, field):
+    """ Check the result at zero-based index `num` against the table ('param'/'value'
+        rows or names plus one value row). 'in field X' prefixes names with 'X+'.
+    """
+    assert not nominatim_result.is_simple()
+    assert len(nominatim_result) > num
+
+    vertical = datatable[0] == ['param', 'value']
+    expected = datatable[1:] if vertical else zip(datatable[0], datatable[1])
+    prefix = f"{field}+" if field else ''
+
+    for name, value in expected:
+        assert ResultAttr(nominatim_result.result[num], prefix + name) == value
+
+
+@given(step_parse(r'the (?P<step>[0-9.]+ )?grid(?: with origin (?P<origin>.*))?'),
+       target_fixture='node_grid')
+def set_node_grid(datatable, step, origin):
+    """ Build the node grid from the table. An optional step is converted to
+        float, an optional origin is either 'x,y' or a name from ALIASES.
+    """
+    spacing = None if step is None else float(step)
+    if origin and ',' in origin:
+        parts = origin.split(',')
+        if len(parts) != 2:
+            raise RuntimeError('Grid origin expects origin with x,y coordinates.')
+        origin = [float(part) for part in parts]
+    elif origin:
+        if origin not in ALIASES:
+            raise RuntimeError('Grid origin must be either coordinate or alias.')
+        origin = ALIASES[origin]
+
+    return Grid(datatable, spacing, origin)
+
+
+@then(step_parse('(?P<table>placex?) has no entry for '
+                 r'(?P<osm_type>[NRW])(?P<osm_id>\d+)(?::(?P<osm_class>\S+))?'),
+      converters={'osm_id': int})
+def check_place_missing_lines(db_conn, table, osm_type, osm_id, osm_class):
+    sql = pysql.SQL("""SELECT count(*) FROM {}
+                       WHERE osm_type = %s and osm_id = %s""").format(pysql.Identifier(table))
+    params = [osm_type, int(osm_id)]  # osm_id already went through the int converter
+    if osm_class:  # optional ':class' suffix narrows the lookup to that class
+        sql += pysql.SQL(' AND class = %s')
+        params.append(osm_class)
+
+    with db_conn.cursor() as cur:
+        assert cur.execute(sql, params).fetchone()[0] == 0  # no matching row may exist
diff --git a/test/bdd/db/import/naming.feature b/test/bdd/db/import/naming.feature
deleted file mode 100644
index b739cbae..00000000
--- a/test/bdd/db/import/naming.feature
+++ /dev/null
@@ -1,105 +0,0 @@
-@DB
-Feature: Import and search of names
-    Tests all naming related import issues
-
-    Scenario: No copying name tag if only one name
-        Given the places
-          | osm | class | type      | name   | geometry |
-          | N1  | place | locality  | german | country:de |
-        When importing
-        Then placex contains
-          | object | country_code | name+name |
-          | N1     | de           | german |
-
-    Scenario: Copying name tag to default language if it does not exist
-        Given the places
-          | osm | class | type      | name   | name+name:fi | geometry |
-          | N1  | place | locality  | german | finnish      | country:de |
-        When importing
-        Then placex contains
-          | object | country_code | name   | name+name:fi | name+name:de |
-          | N1     | de           | german | finnish      | german       |
-
-    Scenario: Copying default language name tag to name if it does not exist
-        Given the places
-          | osm | class | type     | name+name:de | name+name:fi | geometry |
-          | N1  | place | locality | german       | finnish      | country:de |
-        When importing
-        Then placex contains
-          | object | country_code | name   | name+name:fi | name+name:de |
-          | N1     | de           | german | finnish      | german       |
-
-    Scenario: Do not overwrite default language with name tag
-        Given the places
-          | osm | class | type     | name   | name+name:fi | name+name:de | geometry |
-          | N1  | place | locality | german | finnish      | local        | country:de |
-        When importing
-        Then placex contains
-          | object | country_code | name   | name+name:fi | name+name:de |
-          | N1     | de           | german | finnish      | local        |
-
-    Scenario Outline: Names in any script can be found
-        Given the places
-            | osm | class | type   | name   |
-            | N1  | place | hamlet | <name> |
-        When importing
-        And sending search query "<name>"
-        Then results contain
-            | osm |
-            | N1  |
-
-     Examples:
-        | name |
-        | Berlin |
-        | 北京 |
-        | Вологда |
-        | Αθήνα |
-        | القاهرة |
-        | រាជធានីភ្នំពេញ |
-        | 東京都 |
-        | ပုဗ္ဗသီရိ |
-
-
-    Scenario: German umlauts can be found when expanded
-        Given the places
-            | osm | class | type | name+name:de |
-            | N1  | place | city | Münster      |
-            | N2  | place | city | Köln         |
-            | N3  | place | city | Gräfenroda   |
-        When importing
-        When sending search query "münster"
-        Then results contain
-            | osm |
-            | N1  |
-        When sending search query "muenster"
-        Then results contain
-            | osm |
-            | N1  |
-        When sending search query "munster"
-        Then results contain
-            | osm |
-            | N1  |
-        When sending search query "Köln"
-        Then results contain
-            | osm |
-            | N2  |
-        When sending search query "Koeln"
-        Then results contain
-            | osm |
-            | N2  |
-        When sending search query "Koln"
-        Then results contain
-            | osm |
-            | N2  |
-        When sending search query "gräfenroda"
-        Then results contain
-            | osm |
-            | N3  |
-        When sending search query "graefenroda"
-        Then results contain
-            | osm |
-            | N3  |
-        When sending search query "grafenroda"
-        Then results contain
-            | osm |
-            | N3  |
diff --git a/test/bdd/db/query/normalization.feature b/test/bdd/db/query/normalization.feature
deleted file mode 100644
index 47906133..00000000
--- a/test/bdd/db/query/normalization.feature
+++ /dev/null
@@ -1,226 +0,0 @@
-@DB
-Feature: Import and search of names
-    Tests all naming related issues: normalisation,
-    abbreviations, internationalisation, etc.
-
-    Scenario: non-latin scripts can be found
-        Given the places
-          | osm | class | type      | name |
-          | N1  | place | locality  | Речицкий район |
-          | N2  | place | locality  | Refugio de montaña |
-          | N3  | place | locality  | 高槻市|
-          | N4  | place | locality  | الدوحة |
-        When importing
-        When sending search query "Речицкий район"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Refugio de montaña"
-        Then results contain
-         | ID | osm |
-         | 0  | N2 |
-        When sending search query "高槻市"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-        When sending search query "الدوحة"
-        Then results contain
-         | ID | osm |
-         | 0  | N4 |
-
-    Scenario: Case-insensitivity of search
-        Given the places
-          | osm | class | type      | name |
-          | N1  | place | locality  | FooBar |
-        When importing
-        Then placex contains
-          | object | class  | type     | name+name |
-          | N1     | place  | locality | FooBar |
-        When sending search query "FooBar"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "foobar"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "fOObar"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "FOOBAR"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-
-    Scenario: Multiple spaces in name
-        Given the places
-          | osm | class | type      | name |
-          | N1  | place | locality  | one two  three |
-        When importing
-        When sending search query "one two three"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "one   two three"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "one two  three"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "    one two three"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-
-    Scenario: Special characters in name
-        Given the places
-          | osm | class | type      | name+name:de |
-          | N1  | place | locality  | Jim-Knopf-Straße |
-          | N2  | place | locality  | Smith/Weston |
-          | N3  | place | locality  | space mountain |
-          | N4  | place | locality  | space |
-          | N5  | place | locality  | mountain |
-        When importing
-        When sending search query "Jim-Knopf-Str"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Jim Knopf-Str"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Jim Knopf Str"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Jim/Knopf-Str"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Jim-Knopfstr"
-        Then results contain
-         | ID | osm |
-         | 0  | N1 |
-        When sending search query "Smith/Weston"
-        Then results contain
-         | ID | osm |
-         | 0  | N2 |
-        When sending search query "Smith Weston"
-        Then results contain
-         | ID | osm |
-         | 0  | N2 |
-        When sending search query "Smith-Weston"
-        Then results contain
-         | ID | osm |
-         | 0  | N2 |
-        When sending search query "space mountain"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-        When sending search query "space-mountain"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-        When sending search query "space/mountain"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-        When sending search query "space\mountain"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-        When sending search query "space(mountain)"
-        Then results contain
-         | ID | osm |
-         | 0  | N3 |
-
-    Scenario: Landuse with name are found
-        Given the grid
-          | 1 | 2 |
-          | 3 |   |
-        Given the places
-          | osm | class    | type        | name     | geometry |
-          | R1  | natural  | meadow      | landuse1 | (1,2,3,1) |
-          | R2  | landuse  | industrial  | landuse2 | (2,3,1,2) |
-        When importing
-        When sending search query "landuse1"
-        Then results contain
-         | ID | osm |
-         | 0  | R1 |
-        When sending search query "landuse2"
-        Then results contain
-         | ID | osm |
-         | 0  | R2 |
-
-    Scenario: Postcode boundaries without ref
-        Given the grid with origin FR
-          |   | 2 |   |
-          | 1 |   | 3 |
-        Given the places
-          | osm | class    | type        | postcode  | geometry |
-          | R1  | boundary | postal_code | 123-45    | (1,2,3,1) |
-        When importing
-        When sending search query "123-45"
-        Then results contain
-         | ID | osm |
-         | 0  | R1 |
-
-    Scenario Outline: Housenumbers with special characters are found
-        Given the grid
-            | 1 |  |   |  | 2 |
-            |   |  | 9 |  |   |
-        And the places
-            | osm | class   | type    | name    | geometry |
-            | W1  | highway | primary | Main St | 1,2      |
-        And the places
-            | osm | class    | type | housenr | geometry |
-            | N1  | building | yes  | <nr>    | 9        |
-        When importing
-        And sending search query "Main St <nr>"
-        Then results contain
-         | osm | display_name |
-         | N1  | <nr>, Main St |
-
-    Examples:
-        | nr |
-        | 1  |
-        | 3456 |
-        | 1 a |
-        | 56b |
-        | 1 A |
-        | 2è |
-        | 1Ð  |
-        | 1 Ðº1 |
-        | 23-123 |
-
-    Scenario Outline: Housenumbers in lists are found
-        Given the grid
-            | 1 |  |   |  | 2 |
-            |   |  | 9 |  |   |
-        And the places
-            | osm | class   | type    | name    | geometry |
-            | W1  | highway | primary | Main St | 1,2      |
-        And the places
-            | osm | class    | type | housenr   | geometry |
-            | N1  | building | yes  | <nr-list> | 9        |
-        When importing
-        And sending search query "Main St <nr>"
-        Then results contain
-         | ID | osm | display_name |
-         | 0  | N1  | <nr-list>, Main St |
-
-    Examples:
-        | nr-list    | nr |
-        | 1,2,3      | 1  |
-        | 1,2,3      | 2  |
-        | 1, 2, 3    | 3  |
-        | 45 ;67;3   | 45 |
-        | 45 ;67;3   | 67 |
-        | 1a;1k      | 1a |
-        | 1a;1k      | 1k |
-        | 34/678     | 34 |
-        | 34/678     | 678 |
-        | 34/678     | 34/678 |
diff --git a/test/bdd/environment.py b/test/bdd/environment.py
deleted file mode 100644
index 7535c508..00000000
--- a/test/bdd/environment.py
+++ /dev/null
@@ -1,61 +0,0 @@
-# SPDX-License-Identifier: GPL-3.0-or-later
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2024 by the Nominatim developer community.
-# For a full list of authors see the git log.
-from pathlib import Path
-import sys
-
-from behave import *
-
-sys.path.insert(1, str(Path(__file__, '..', '..', '..', 'src').resolve()))
-
-from steps.geometry_factory import GeometryFactory
-from steps.nominatim_environment import NominatimEnvironment
-
-TEST_BASE_DIR = Path(__file__, '..', '..').resolve()
-
-userconfig = {
-    'REMOVE_TEMPLATE' : False,
-    'KEEP_TEST_DB' : False,
-    'DB_HOST' : None,
-    'DB_PORT' : None,
-    'DB_USER' : None,
-    'DB_PASS' : None,
-    'TEMPLATE_DB' : 'test_template_nominatim',
-    'TEST_DB' : 'test_nominatim',
-    'API_TEST_DB' : 'test_api_nominatim',
-    'API_TEST_FILE'  : TEST_BASE_DIR / 'testdb' / 'apidb-test-data.pbf',
-    'TOKENIZER' : None, # Test with a custom tokenizer
-    'STYLE' : 'extratags',
-    'API_ENGINE': 'falcon'
-}
-
-use_step_matcher("re")
-
-def before_all(context):
-    # logging setup
-    context.config.setup_logging()
-    # set up -D options
-    for k,v in userconfig.items():
-        context.config.userdata.setdefault(k, v)
-    # Nominatim test setup
-    context.nominatim = NominatimEnvironment(context.config.userdata)
-    context.osm = GeometryFactory()
-
-
-def before_scenario(context, scenario):
-    if not 'SQLITE' in context.tags \
-       and context.config.userdata['API_TEST_DB'].startswith('sqlite:'):
-        context.scenario.skip("Not usable with Sqlite database.")
-    elif 'DB' in context.tags:
-        context.nominatim.setup_db(context)
-    elif 'APIDB' in context.tags:
-        context.nominatim.setup_api_db()
-    elif 'UNKNOWNDB' in context.tags:
-        context.nominatim.setup_unknown_db()
-
-def after_scenario(context, scenario):
-    if 'DB' in context.tags:
-        context.nominatim.teardown_db(context)
diff --git a/test/bdd/features/api/details/language.feature b/test/bdd/features/api/details/language.feature
new file mode 100644
index 00000000..f15b4ffb
--- /dev/null
+++ b/test/bdd/features/api/details/language.feature
@@ -0,0 +1,83 @@
+Feature: Localization of search results
+
+    Scenario: default language
+        When sending v1/details
+          | osmtype | osmid   |
+          | R       | 1155955 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liechtenstein |
+
+    Scenario: accept-language first
+        When sending v1/details
+          | osmtype | osmid   | accept-language |
+          | R       | 1155955 | zh,de |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | 列支敦士登 |
+
+    Scenario: accept-language missing
+        When sending v1/details
+          | osmtype | osmid   | accept-language |
+          | R       | 1155955 | xx,fr,en,de |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liechtenstein |
+
+    Scenario: http accept language header first
+        Given the HTTP header
+          | accept-language |
+          | fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/details
+          | osmtype | osmid   |
+          | R       | 1155955 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liktinstein |
+
+    Scenario: http accept language header and accept-language
+        Given the HTTP header
+          | accept-language |
+          | fr-ca,fr;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/details
+          | osmtype | osmid   | accept-language |
+          | R       | 1155955 | fo,en |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liktinstein |
+
+    Scenario: http accept language header fallback
+        Given the HTTP header
+          | accept-language |
+          | fo-ca,en-ca;q=0.5 |
+        When sending v1/details
+          | osmtype | osmid   |
+          | R       | 1155955 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liktinstein |
+
+    Scenario: http accept language header fallback (upper case)
+        Given the HTTP header
+          | accept-language |
+          | fo-FR;q=0.8,en-ca;q=0.5 |
+        When sending v1/details
+          | osmtype | osmid   |
+          | R       | 1155955 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | localname |
+          | Liktinstein |
diff --git a/test/bdd/features/api/details/params.feature b/test/bdd/features/api/details/params.feature
new file mode 100644
index 00000000..1212e70a
--- /dev/null
+++ b/test/bdd/features/api/details/params.feature
@@ -0,0 +1,99 @@
+Feature: Object details
+    Testing different parameter options for details API.
+
+    Scenario: Basic details
+        When sending v1/details
+          | osmtype | osmid |
+          | W       | 297699560 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes geometry
+        And the result has no attributes keywords,address,linked_places,parentof
+        And the result contains
+            | geometry+type  |
+            | Point |
+
+    Scenario: Basic details with pretty printing
+        When sending v1/details
+          | osmtype | osmid     | pretty |
+          | W       | 297699560 | 1      |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes geometry
+        And the result has no attributes keywords,address,linked_places,parentof
+
+    Scenario: Details with addressdetails
+        When sending v1/details
+          | osmtype | osmid     | addressdetails |
+          | W       | 297699560 | 1              |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes address
+
+    Scenario: Details with linkedplaces
+        When sending v1/details
+          | osmtype | osmid  | linkedplaces |
+          | R       | 123924 | 1            |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes linked_places
+
+    Scenario: Details with hierarchy
+        When sending v1/details
+          | osmtype | osmid     | hierarchy |
+          | W       | 297699560 | 1         |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes hierarchy
+
+    Scenario: Details with grouped hierarchy
+        When sending v1/details
+          | osmtype | osmid     | hierarchy | group_hierarchy |
+          | W       | 297699560 | 1         | 1               |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes hierarchy
+
+    Scenario Outline: Details with keywords
+        When sending v1/details
+            | osmtype | osmid | keywords |
+            | <type>  | <id>  | 1 |
+        Then a HTTP 200 is returned
+        Then the result is valid json
+        And the result has attributes keywords
+
+    Examples:
+      | type | id |
+      | W    | 297699560 |
+      | W    | 243055645 |
+      | W    | 243055716 |
+      | W    | 43327921  |
+
+    # ticket #1343
+    Scenario: Details of a country with keywords
+        When sending v1/details
+            | osmtype | osmid   | keywords |
+            | R       | 1155955 | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes keywords
+
+    Scenario Outline: Details with full geometry
+        When sending v1/details
+            | osmtype | osmid | polygon_geojson |
+            | <type>  | <id>  | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes geometry
+        And the result contains
+            | geometry+type |
+            | <geometry> |
+
+    Examples:
+            | type | id        | geometry   |
+            | W    | 297699560 | LineString |
+            | W    | 243055645 | Polygon    |
+            | W    | 243055716 | Polygon    |
+            | W    | 43327921  | LineString |
+
+
diff --git a/test/bdd/features/api/details/simple.feature b/test/bdd/features/api/details/simple.feature
new file mode 100644
index 00000000..4010d0ff
--- /dev/null
+++ b/test/bdd/features/api/details/simple.feature
@@ -0,0 +1,99 @@
+Feature: Object details
+    Check details page for correctness
+
+    Scenario Outline: Details request with OSM id
+        When sending v1/details
+          | osmtype | osmid |
+          | <type>  | <id>  |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+            | osm_type | osm_id |
+            | <type>   | <id> |
+
+    Examples:
+     | type | id |
+     | N    | 5484325405 |
+     | W    | 43327921 |
+     | R    | 123924 |
+
+    Scenario Outline: Details request with different class types for the same OSM id
+        When sending v1/details
+          | osmtype | osmid     | class   |
+          | N       | 300209696 | <class> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | osm_type | osm_id    | category |
+          | N        | 300209696 | <class>  |
+
+    Examples:
+     | class |
+     | tourism |
+     | mountain_pass |
+
+    Scenario: Details request without osmtype
+        When sending v1/details
+          | osmid     |
+          | 300209696 |
+        Then a HTTP 400 is returned
+        And the result is valid json
+
+    Scenario: Details request with unknown OSM id
+        When sending v1/details
+          | osmtype | osmid |
+          | R       | 1     |
+        Then a HTTP 404 is returned
+        And the result is valid json
+
+    Scenario: Details request with unknown class
+        When sending v1/details
+          | osmtype | osmid     | class   |
+          | N       | 300209696 | highway |
+        Then a HTTP 404 is returned
+        And the result is valid json
+
+    Scenario: Details for interpolation way return the interpolation
+        When sending v1/details
+          | osmtype | osmid |
+          | W       | 1     |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | category | type   | osm_type | osm_id | admin_level |
+          | place    | houses | W        | 1      | 15          |
+
+
+    @skip
+    Scenario: Details for interpolation way return the interpolation
+        When sending details query for 112871
+        Then the result is valid json
+        And the result contains
+            | category | type   | admin_level |
+            | place    | houses | 15          |
+        And result has not attributes osm_type,osm_id
+
+
+    @skip
+    Scenario: Details for postcode
+        When sending details query for 112820
+        Then the result is valid json
+        And the result contains
+            | category | type     | admin_level |
+            | place    | postcode | 15          |
+        And result has not attributes osm_type,osm_id
+
+
+    Scenario Outline: Details debug output returns no errors
+        When sending v1/details
+          | osmtype | osmid | debug |
+          | <type>  | <id>  | 1     |
+        Then a HTTP 200 is returned
+        And the result is valid html
+
+    Examples:
+     | type | id |
+     | N    | 5484325405 |
+     | W    | 43327921 |
+     | R    | 123924 |
+
diff --git a/test/bdd/features/api/lookup/simple.feature b/test/bdd/features/api/lookup/simple.feature
new file mode 100644
index 00000000..6ecb88fa
--- /dev/null
+++ b/test/bdd/features/api/lookup/simple.feature
@@ -0,0 +1,71 @@
+Feature: Tests for finding places by osm_type and osm_id
+    Simple tests for response format.
+
+    Scenario Outline: Address lookup for existing object
+        When sending v1/lookup with format <format>
+          | osm_ids |
+          | N5484325405,W43327921,,R123924,X99,N0 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And exactly 3 results are returned
+
+    Examples:
+        | format      | outformat   |
+        | xml         | xml         |
+        | json        | json        |
+        | jsonv2      | json        |
+        | geojson     | geojson     |
+        | geocodejson | geocodejson |
+
+    Scenario: Address lookup for non-existing or invalid object
+        When sending v1/lookup
+          | osm_ids |
+          | X99,,N0,nN158845944,ABC,,W9 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And exactly 0 results are returned
+
+    Scenario Outline: Boundingbox is returned
+        When sending v1/lookup with format <format>
+          | osm_ids |
+          | N5484325405,W43327921 |
+        Then the result is valid <outformat>
+        And the result set contains exactly
+          | object      | boundingbox!in_box |
+          | N5484325405 | 47.135,47.14,9.52,9.525 |
+          | W43327921   | 47.07,47.08,9.50,9.52   |
+
+    Examples:
+        | format      | outformat   |
+        | xml         | xml         |
+        | json        | json        |
+        | jsonv2      | json        |
+        | geojson     | geojson     |
+
+    Scenario: Linked places return information from the linkee
+        When sending v1/lookup with format geocodejson
+          | osm_ids |
+          | N1932181216 |
+        Then the result is valid geocodejson
+        And exactly 1 result is returned
+        And all results contain
+          | name  |
+          | Vaduz |
+
+    Scenario Outline: Force error by providing too many ids
+        When sending v1/lookup with format <format>
+          | osm_ids |
+          | N1,N2,N3,N4,N5,N6,N7,N8,N9,N10,N11,N12,N13,N14,N15,N16,N17,N18,N19,N20,N21,N22,N23,N24,N25,N26,N27,N28,N29,N30,N31,N32,N33,N34,N35,N36,N37,N38,N39,N40,N41,N42,N43,N44,N45,N46,N47,N48,N49,N50,N51 |
+        Then a HTTP 400 is returned
+        And the result is valid <outformat>
+        And the result contains
+          | error+code | error+message |
+          | 400        | Too many object IDs. |
+
+    Examples:
+        | format      | outformat   |
+        | xml         | xml         |
+        | json        | json        |
+        | jsonv2      | json        |
+        | geojson     | json        |
+        | geocodejson | json        |
diff --git a/test/bdd/features/api/reverse/geometry.feature b/test/bdd/features/api/reverse/geometry.feature
new file mode 100644
index 00000000..a04b4e01
--- /dev/null
+++ b/test/bdd/features/api/reverse/geometry.feature
@@ -0,0 +1,56 @@
+Feature: Geometries for reverse geocoding
+    Tests for returning geometries with reverse
+
+    Scenario: Reverse - polygons are returned fully by default
+        When sending v1/reverse
+          | lat      | lon     | polygon_text |
+          | 47.13803 | 9.52264 | 1            |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geotext!fm |
+          | POLYGON\(\(9.5225302 47.138066, ?9.5225348 47.1379282, ?9.5226142 47.1379294, ?9.5226143 47.1379257, ?9.522615 47.137917, ?9.5226225 47.1379098, ?9.5226334 47.1379052, ?9.5226461 47.1379037, ?9.5226588 47.1379056, ?9.5226693 47.1379107, ?9.5226762 47.1379181, ?9.5226762 47.1379268, ?9.5226761 47.1379308, ?9.5227366 47.1379317, ?9.5227352 47.1379753, ?9.5227608 47.1379757, ?9.5227595 47.1380148, ?9.5227355 47.1380145, ?9.5227337 47.1380692, ?9.5225302 47.138066\)\) |
+
+
+    Scenario: Reverse - polygons can be slightly simplified
+        When sending v1/reverse
+          | lat      | lon     | polygon_text | polygon_threshold |
+          | 47.13803 | 9.52264 | 1            | 0.00001            |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geotext!fm |
+          | POLYGON\(\(9.5225302 47.138066, ?9.5225348 47.1379282, ?9.5226142 47.1379294, ?9.5226225 47.1379098, ?9.5226588 47.1379056, ?9.5226761 47.1379308, ?9.5227366 47.1379317, ?9.5227352 47.1379753, ?9.5227608 47.1379757, ?9.5227595 47.1380148, ?9.5227355 47.1380145, ?9.5227337 47.1380692, ?9.5225302 47.138066\)\) |
+
+
+    Scenario: Reverse - polygons can be much simplified
+        When sending v1/reverse
+          | lat      | lon     | polygon_text | polygon_threshold |
+          | 47.13803 | 9.52264 | 1            | 0.9               |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geotext!fm |
+          | POLYGON\(\([0-9. ]+, ?[0-9. ]+, ?[0-9. ]+, ?[0-9. ]+(, ?[0-9. ]+)?\)\) |
+
+
+    Scenario: Reverse - for polygons return the centroid as center point
+        When sending v1/reverse
+          | lat      | lon     |
+          | 47.13836 | 9.52304 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | lon       | lat        |
+          | 9.5227108 | 47.1381805 |
+
+
+    Scenario: Reverse - for streets return the closest point as center point
+        When sending v1/reverse
+          | lat      | lon     |
+          | 47.13368 | 9.52942 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | lon       | lat        |
+          | 9.5294315 | 47.1336817 |
diff --git a/test/bdd/features/api/reverse/language.feature b/test/bdd/features/api/reverse/language.feature
new file mode 100644
index 00000000..927f258c
--- /dev/null
+++ b/test/bdd/features/api/reverse/language.feature
@@ -0,0 +1,47 @@
+Feature: Localization of reverse search results
+
+    Scenario: Reverse - default language
+        When sending v1/reverse with format jsonv2
+          | lat   | lon  |
+          | 47.14 | 9.55 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | address+country |
+          | Liechtenstein |
+
+    Scenario: Reverse - accept-language parameter
+        When sending v1/reverse with format jsonv2
+          | lat   | lon  | accept-language |
+          | 47.14 | 9.55 | ja,en |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | address+country |
+          | リヒテンシュタイン |
+
+    Scenario: Reverse - HTTP accept language header
+        Given the HTTP header
+          | accept-language |
+          | fo-ca,fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/reverse with format jsonv2
+          | lat   | lon  |
+          | 47.14 | 9.55 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | address+country |
+          | Liktinstein |
+
+    Scenario: Reverse - accept-language parameter and HTTP header
+        Given the HTTP header
+          | accept-language |
+          | fo-ca,fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/reverse with format jsonv2
+          | lat   | lon  | accept-language |
+          | 47.14 | 9.55 | en |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | address+country |
+          | Liechtenstein |
diff --git a/test/bdd/api/reverse/layers.feature b/test/bdd/features/api/reverse/layers.feature
similarity index 80%
rename from test/bdd/api/reverse/layers.feature
rename to test/bdd/features/api/reverse/layers.feature
index f1885f0e..809d7e3d 100644
--- a/test/bdd/api/reverse/layers.feature
+++ b/test/bdd/features/api/reverse/layers.feature
@@ -1,24 +1,20 @@
-@SQLITE
-@APIDB
 Feature: Layer parameter in reverse geocoding
     Testing correct function of layer selection while reverse geocoding
 
     Scenario: POIs are selected by default
-        When sending v1/reverse at 47.14077,9.52414
-        Then results contain
+        When reverse geocoding 47.14077,9.52414
+        Then the result contains
           | category | type      |
           | tourism  | viewpoint |
 
-
     Scenario Outline: Same address level POI with different layers
-        When sending v1/reverse at 47.14077,9.52414
+        When reverse geocoding 47.14077,9.52414
           | layer   |
           | <layer> |
-        Then results contain
+        Then the result contains
           | category   |
           | <category> |
 
-
         Examples:
           | layer           | category |
           | address         | highway  |
@@ -28,12 +24,11 @@ Feature: Layer parameter in reverse geocoding
           | address,natural | highway  |
           | natural,poi     | tourism  |
 
-
      Scenario Outline: POIs are not selected without housenumber for address layer
-        When sending v1/reverse at 47.13816,9.52168
+        When reverse geocoding 47.13816,9.52168
           | layer   |
           | <layer> |
-        Then results contain
+        Then the result contains
           | category   | type   |
           | <category> | <type> |
 
@@ -42,21 +37,19 @@ Feature: Layer parameter in reverse geocoding
           | address,poi | highway  | bus_stop |
           | address     | amenity  | parking  |
 
-
      Scenario: Between natural and low-zoom address prefer natural
-         When sending v1/reverse at 47.13636,9.52094
+         When reverse geocoding 47.13636,9.52094
            | layer           | zoom |
            | natural,address | 15   |
-         Then results contain
+         Then the result contains
            | category |
            | waterway |
 
-
     Scenario Outline: Search for mountain peaks begins at level 12
-        When sending v1/reverse at 47.08293,9.57109
+        When reverse geocoding 47.08293,9.57109
           | layer   | zoom   |
           | natural | <zoom> |
-        Then results contain
+        Then the result contains
           | category   | type   |
           | <category> | <type> |
 
@@ -65,12 +58,11 @@ Feature: Layer parameter in reverse geocoding
           | 12   | natural  | peak  |
           | 13   | waterway | river |
 
-
      Scenario Outline: Reverse search with manmade layers
-        When sending v1/reverse at 32.46904,-86.44439
+        When reverse geocoding 32.46904,-86.44439
           | layer   |
           | <layer> |
-        Then results contain
+        Then the result contains
           | category   | type   |
           | <category> | <type> |
 
diff --git a/test/bdd/features/api/reverse/queries.feature b/test/bdd/features/api/reverse/queries.feature
new file mode 100644
index 00000000..eb1ae75f
--- /dev/null
+++ b/test/bdd/features/api/reverse/queries.feature
@@ -0,0 +1,80 @@
+Feature: Reverse geocoding
+    Testing the reverse function
+
+    Scenario: Reverse - Unknown countries fall back to default country grid
+        When reverse geocoding 45.174,-103.072
+        Then the result contains
+          | category | type    | display_name |
+          | place    | country | United States |
+
+    Scenario: Reverse - No TIGER house number for zoom < 18
+        When reverse geocoding 32.4752389363,-86.4810198619
+          | zoom |
+          | 17 |
+        Then the result contains
+          | osm_type | category |
+          | way      | highway  |
+        And the result contains in field address
+          | road                | postcode | country_code |
+          | Upper Kingston Road | 36067    | us |
+
+    Scenario: Reverse - Address with non-numerical house number
+        When reverse geocoding 47.107465,9.52838521614
+        Then the result contains in field address
+          | house_number | road |
+          | 39A/B        | Dorfstrasse |
+
+    Scenario: Reverse - Address with numerical house number
+        When reverse geocoding 47.168440329479594,9.511551699184338
+        Then the result contains in field address
+          | house_number | road |
+          | 6            | Schmedgässle |
+
+    Scenario Outline: Reverse - Zoom levels below 5 result in country
+        When reverse geocoding 47.16,9.51
+         | zoom |
+         | <zoom> |
+        Then the result contains
+         | display_name |
+         | Liechtenstein |
+
+        Examples:
+             | zoom |
+             | 0    |
+             | 1    |
+             | 2    |
+             | 3    |
+             | 4    |
+
+    Scenario: Reverse - When on a street, the closest interpolation is shown
+        When reverse geocoding 47.118457166193245,9.570678289621355
+         | zoom |
+         | 18 |
+        Then the result contains
+         | display_name |
+         | 1021, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+
+    # github 2214
+    Scenario: Reverse - Interpolations do not override house numbers when they are closer
+        When reverse geocoding 47.11778,9.57255
+         | zoom |
+         | 18 |
+        Then the result contains
+         | display_name |
+         | 5, Grosssteg, Steg, Triesenberg, Oberland, 9497, Liechtenstein |
+
+    Scenario: Reverse - Interpolations do not override house numbers when they are closer (2)
+        When reverse geocoding 47.11834,9.57167
+         | zoom |
+         | 18 |
+        Then the result contains
+         | display_name |
+         | 3, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+
+    Scenario: Reverse - When on a street with zoom 18, the closest housenumber is returned
+        When reverse geocoding 47.11755503977281,9.572722250405036
+         | zoom |
+         | 18 |
+        Then the result contains in field address
+         | house_number |
+         | 7 |
diff --git a/test/bdd/features/api/reverse/v1_geocodejson.feature b/test/bdd/features/api/reverse/v1_geocodejson.feature
new file mode 100644
index 00000000..40be511d
--- /dev/null
+++ b/test/bdd/features/api/reverse/v1_geocodejson.feature
@@ -0,0 +1,143 @@
+Feature: Geocodejson for Reverse API
+    Testing correctness of geocodejson output (API version v1).
+
+    Scenario Outline: Reverse geocodejson - Simple with no results
+        When sending v1/reverse with format geocodejson
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | error |
+          | Unable to geocode |
+
+        Examples:
+          | lat  | lon |
+          | 0.0  | 0.0 |
+          | 91.3 | 0.4    |
+          | -700 | 0.4    |
+          | 0.2  | 324.44 |
+          | 0.2  | -180.4 |
+
+    Scenario Outline: Reverse geocodejson - Simple OSM result
+        When sending v1/reverse with format geocodejson
+          | lat    | lon   | addressdetails |
+          | 47.066 | 9.504 | <has_address>  |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And the result metadata contains
+          | version | licence | attribution!fm |
+          | 0.1.0   | ODbL    | Data © OpenStreetMap contributors, ODbL 1.0. https?://osm.org/copyright |
+        And all results have <attributes> country,postcode,county,city,district,street,housenumber,admin
+        And all results contain
+          | param               | value |
+          | osm_type            | node |
+          | osm_id              | 6522627624 |
+          | osm_key             | shop |
+          | osm_value           | bakery |
+          | type                | house |
+          | name                | Dorfbäckerei Herrmann |
+          | label               | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
+          | geojson+type        | Point |
+          | geojson+coordinates | [9.5036065, 47.0660892] |
+
+        Examples:
+          | has_address | attributes     |
+          | 1           | attributes     |
+          | 0           | no attributes |
+
+    Scenario: Reverse geocodejson - City housenumber-level address with street
+        When sending v1/reverse with format geocodejson
+          | lat        | lon        |
+          | 47.1068011 | 9.52810091 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | housenumber | street    | postcode | city    | country |
+          | 8           | Im Winkel | 9495     | Triesen | Liechtenstein |
+         And all results contain
+          | admin+level6 | admin+level8 |
+          | Oberland     | Triesen      |
+
+    Scenario: Reverse geocodejson - Town street-level address with street
+        When sending v1/reverse with format geocodejson
+          | lat    | lon   | zoom |
+          | 47.066 | 9.504 | 16 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | name    | city    | postcode | country |
+          | Gnetsch | Balzers | 9496     | Liechtenstein |
+
+    Scenario: Reverse geocodejson - Poi street-level address with footway
+        When sending v1/reverse with format geocodejson
+          | lat      | lon     |
+          | 47.06515 | 9.50083 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | street  | city    | postcode | country |
+          | Burgweg | Balzers | 9496     | Liechtenstein |
+
+    Scenario: Reverse geocodejson - City address with suburb
+        When sending v1/reverse with format geocodejson
+          | lat       | lon      |
+          | 47.146861 | 9.511771 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | housenumber | street   | district | city  | postcode | country |
+          | 5           | Lochgass | Ebenholz | Vaduz | 9490     | Liechtenstein |
+
+    Scenario: Reverse geocodejson - Tiger address
+        When sending v1/reverse with format geocodejson
+          | lat           | lon            |
+          | 32.4752389363 | -86.4810198619 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+         | osm_type | osm_id    | osm_key | osm_value | type  |
+         | way      | 396009653 | place   | house     | house |
+        And all results contain
+         | housenumber | street              | city       | county         | postcode | country       |
+         | 707         | Upper Kingston Road | Prattville | Autauga County | 36067    | United States |
+
+    Scenario: Reverse geocodejson - Interpolation address
+        When sending v1/reverse with format geocodejson
+          | lat       | lon        |
+          | 47.118533 | 9.57056562 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | osm_type | osm_id | osm_key | osm_value | type  |
+          | way      | 1      | place   | house     | house |
+        And all results contain
+          | label |
+          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+        And all results have no attributes name
+
+    Scenario: Reverse geocodejson - Line geometry output is supported
+        When sending v1/reverse with format geocodejson
+          | lat      | lon     | polygon_geojson |
+          | 47.06597 | 9.50467 | 1  |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | geojson+type |
+          | LineString   |
+
+    Scenario Outline: Reverse geocodejson - Only geojson polygons are supported
+        When sending v1/reverse with format geocodejson
+          | lat      | lon     | <param> |
+          | 47.06597 | 9.50467 | 1       |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson with 1 result
+        And all results contain
+          | geojson+type |
+          | Point        |
+
+        Examples:
+          | param |
+          | polygon_text |
+          | polygon_svg  |
+          | polygon_kml  |
diff --git a/test/bdd/features/api/reverse/v1_geojson.feature b/test/bdd/features/api/reverse/v1_geojson.feature
new file mode 100644
index 00000000..83f98e65
--- /dev/null
+++ b/test/bdd/features/api/reverse/v1_geojson.feature
@@ -0,0 +1,102 @@
+Feature: Geojson for Reverse API
+    Testing correctness of geojson output (API version v1).
+
+    Scenario Outline: Reverse geojson - Simple with no results
+        When sending v1/reverse with format geojson
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | error |
+          | Unable to geocode |
+
+        Examples:
+          | lat  | lon |
+          | 0.0  | 0.0 |
+          | 91.3 | 0.4    |
+          | -700 | 0.4    |
+          | 0.2  | 324.44 |
+          | 0.2  | -180.4 |
+
+    Scenario Outline: Reverse geojson - Simple OSM result
+        When sending v1/reverse with format geojson
+          | lat    | lon   | addressdetails |
+          | 47.066 | 9.504 | <has_address>  |
+        Then a HTTP 200 is returned
+        And the result is valid geojson with 1 result
+        And the result metadata contains
+          | licence!fm |
+          | Data © OpenStreetMap contributors, ODbL 1.0. http://osm.org/copyright |
+        And all results have attributes place_id, importance
+        And all results have <attributes> address
+        And all results contain
+          | param               | value |
+          | osm_type            | node |
+          | osm_id              | 6522627624 |
+          | place_rank          | 30 |
+          | category            | shop |
+          | type                | bakery |
+          | addresstype         | shop |
+          | name                | Dorfbäckerei Herrmann |
+          | display_name        | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
+          | boundingbox         | [47.0660392, 47.0661392, 9.5035565, 9.5036565] |
+          | geojson+type        | Point |
+          | geojson+coordinates | [9.5036065, 47.0660892] |
+
+        Examples:
+          | has_address | attributes    |
+          | 1           | attributes    |
+          | 0           | no attributes |
+
+    Scenario: Reverse geojson - Tiger address
+        When sending v1/reverse with format geojson
+          | lat           | lon            |
+          | 32.4752389363 | -86.4810198619 |
+        Then a HTTP 200 is returned
+        And the result is valid geojson with 1 result
+        And all results contain
+          | osm_type | osm_id    | category | type  | addresstype  | place_rank |
+          | way      | 396009653 | place    | house | place        | 30         |
+
+    Scenario: Reverse geojson - Interpolation address
+        When sending v1/reverse with format geojson
+          | lat       | lon        |
+          | 47.118533 | 9.57056562 |
+        Then a HTTP 200 is returned
+        And the result is valid geojson with 1 result
+        And all results contain
+          | osm_type | osm_id | place_rank | category | type    | addresstype |
+          | way      | 1      | 30         | place    | house   | place       |
+        And all results contain
+          | boundingbox!in_box |
+          | 47.118494, 47.118596, 9.570495, 9.570597 |
+        And all results contain
+          | display_name |
+          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+
+    Scenario: Reverse geojson - Line geometry output is supported
+        When sending v1/reverse with format geojson
+          | lat      | lon     | polygon_geojson |
+          | 47.06597 | 9.50467 | 1               |
+        Then a HTTP 200 is returned
+        And the result is valid geojson with 1 result
+        And all results contain
+          | geojson+type |
+          | LineString   |
+
+    Scenario Outline: Reverse geojson - Only geojson polygons are supported
+        When sending v1/reverse with format geojson
+          | lat      | lon     | <param> |
+          | 47.06597 | 9.50467 | 1       |
+        Then a HTTP 200 is returned
+        And the result is valid geojson with 1 result
+        And all results contain
+          | geojson+type |
+          | Point |
+
+        Examples:
+          | param |
+          | polygon_text |
+          | polygon_svg  |
+          | polygon_kml  |
diff --git a/test/bdd/features/api/reverse/v1_json.feature b/test/bdd/features/api/reverse/v1_json.feature
new file mode 100644
index 00000000..829adc5a
--- /dev/null
+++ b/test/bdd/features/api/reverse/v1_json.feature
@@ -0,0 +1,175 @@
+Feature: Json output for Reverse API
+    Testing correctness of json and jsonv2 output (API version v1).
+
+    Scenario Outline: Reverse json - Simple with no results
+        When sending v1/reverse with format json
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | error |
+          | Unable to geocode |
+        When sending v1/reverse with format jsonv2
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | error |
+          | Unable to geocode |
+
+        Examples:
+          | lat  | lon |
+          | 0.0  | 0.0 |
+          | 91.3 | 0.4    |
+          | -700 | 0.4    |
+          | 0.2  | 324.44 |
+          | 0.2  | -180.4 |
+
+    Scenario Outline: Reverse json - OSM result with and without addresses
+        When sending v1/reverse with format json
+          | lat    | lon   | addressdetails |
+          | 47.066 | 9.504 | <has_address>  |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has <attributes> address
+        When sending v1/reverse with format jsonv2
+          | lat    | lon   | addressdetails |
+          | 47.066 | 9.504 | <has_address>  |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has <attributes> address
+
+        Examples:
+          | has_address | attributes    |
+          | 1           | attributes    |
+          | 0           | no attributes |
+
+    Scenario Outline: Reverse json - Simple OSM result
+        When sending v1/reverse with format <format>
+          | lat    | lon   |
+          | 47.066 | 9.504 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes place_id
+        And the result contains
+          | licence!fm |
+          | Data © OpenStreetMap contributors, ODbL 1.0. https?://osm.org/copyright |
+        And the result contains
+          | osm_type | osm_id     |
+          | node     | 6522627624 |
+        And the result contains
+          | lon       | lat        | boundingbox!in_box |
+          | 9.5036065 | 47.0660892 | 47.0660391, 47.0661393, 9.5035564, 9.5036566 |
+        And the result contains
+          | display_name |
+          | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
+        And the result has no attributes namedetails,extratags
+
+        Examples:
+          | format |
+          | json   |
+          | jsonv2 |
+
+    Scenario: Reverse json - Extra attributes of jsonv2 result
+        When sending v1/reverse with format jsonv2
+          | lat    | lon   |
+          | 47.066 | 9.504 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result has attributes importance
+        And the result contains
+          | category | type   | name                  | place_rank | addresstype |
+          | shop     | bakery | Dorfbäckerei Herrmann | 30         | shop        |
+
+    Scenario: Reverse json - Tiger address
+        When sending v1/reverse with format jsonv2
+          | lat           | lon            |
+          | 32.4752389363 | -86.4810198619 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | osm_type | osm_id    | category | type  | addresstype  |
+          | way      | 396009653 | place    | house | place        |
+
+    Scenario Outline: Reverse json - Interpolation address
+        When sending v1/reverse with format <format>
+          | lat       | lon        |
+          | 47.118533 | 9.57056562 |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | osm_type | osm_id |
+          | way      | 1      |
+        And the result contains
+          | lon       | lat        | boundingbox!in_box |
+          | 9.5705468 | 47.1185454 | 47.118494, 47.118596, 9.570495, 9.570597 |
+        And the result contains
+          | display_name |
+          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+
+        Examples:
+          | format |
+          | json   |
+          | jsonv2 |
+
+    Scenario Outline: Reverse json - Output of geojson
+        When sending v1/reverse with format <format>
+          | lat      | lon     | polygon_geojson |
+          | 47.06597 | 9.50467 | 1               |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | geojson+type | geojson+coordinates |
+          | LineString   | [[9.5039353, 47.0657546], [9.5040437, 47.0657781], [9.5040808, 47.065787], [9.5054298, 47.0661407]] |
+
+       Examples:
+          | format |
+          | json   |
+          | jsonv2 |
+
+    Scenario Outline: Reverse json - Output of WKT
+        When sending v1/reverse with format <format>
+          | lat      | lon     | polygon_text |
+          | 47.06597 | 9.50467 | 1            |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | geotext!wkt |
+          | 9.5039353 47.0657546, 9.5040437 47.0657781, 9.5040808 47.065787, 9.5054298 47.0661407 |
+
+       Examples:
+          | format |
+          | json   |
+          | jsonv2 |
+
+    Scenario Outline: Reverse json - Output of SVG
+       When sending v1/reverse with format <format>
+          | lat      | lon     | polygon_svg |
+          | 47.06597 | 9.50467 | 1           |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | svg |
+          | M 9.5039353 -47.0657546 L 9.5040437 -47.0657781 9.5040808 -47.065787 9.5054298 -47.0661407 |
+
+       Examples:
+          | format |
+          | json   |
+          | jsonv2 |
+
+    Scenario Outline: Reverse json - Output of KML
+        When sending v1/reverse with format <format>
+          | lat      | lon     | polygon_kml |
+          | 47.06597 | 9.50467 | 1           |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | geokml!fm |
+          | <LineString><coordinates>9.5039\d*,47.0657\d* 9.5040\d*,47.0657\d* 9.5040\d*,47.065\d* 9.5054\d*,47.0661\d*</coordinates></LineString> |
+
+       Examples:
+          | format |
+          | json   |
+          | jsonv2 |
diff --git a/test/bdd/features/api/reverse/v1_params.feature b/test/bdd/features/api/reverse/v1_params.feature
new file mode 100644
index 00000000..8708a10a
--- /dev/null
+++ b/test/bdd/features/api/reverse/v1_params.feature
@@ -0,0 +1,169 @@
+Feature: v1/reverse Parameter Tests
+    Tests for parameter inputs for the v1 reverse endpoint.
+    This file contains mostly bad parameter input. Valid parameters
+    are tested in the format tests.
+
+    Scenario: Bad format
+        When sending v1/reverse
+          | lat         | lon           | format |
+          | 47.14122383 | 9.52169581334 | sdf |
+        Then a HTTP 400 is returned
+
+    Scenario: Missing lon parameter
+        When sending v1/reverse
+          | lat   |
+          | 52.52 |
+        Then a HTTP 400 is returned
+
+    Scenario: Missing lat parameter
+        When sending v1/reverse
+          | lon |
+          | 52.52 |
+        Then a HTTP 400 is returned
+
+    Scenario Outline: Bad format for lat or lon
+        When sending v1/reverse
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 400 is returned
+
+        Examples:
+          | lat      | lon |
+          | 48.9660  | 8,4482 |
+          | 48,9660  | 8.4482 |
+          | 48,9660  | 8,4482 |
+          | 48.966.0 | 8.4482 |
+          | 48.966   | 8.448.2 |
+          | Nan      | 8.448  |
+          | 48.966   | Nan    |
+          | Inf      | 5.6    |
+          | 5.6      | -Inf   |
+          | <script></script> | 3.4 |
+          | 3.4 | <script></script> |
+          | -45.3    | ;      |
+          | gkjd     | 50     |
+
+    Scenario: Non-numerical zoom levels return an error
+        When sending v1/reverse
+          | lat         | lon           | zoom |
+          | 47.14122383 | 9.52169581334 | adfe |
+        Then a HTTP 400 is returned
+
+    Scenario Outline: Truthy values for boolean parameters
+        When sending v1/reverse
+          | lat         | lon           | addressdetails |
+          | 47.14122383 | 9.52169581334 | <value> |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result has attributes address
+
+        When sending v1/reverse
+          | lat         | lon           | extratags |
+          | 47.14122383 | 9.52169581334 | <value> |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result has attributes extratags
+
+        When sending v1/reverse
+          | lat         | lon           | namedetails |
+          | 47.14122383 | 9.52169581334 | <value> |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result has attributes namedetails
+
+        Examples:
+          | value |
+          | yes   |
+          | no    |
+          | -1    |
+          | 100   |
+          | false |
+          | 00    |
+
+    Scenario: Only one geometry can be requested
+        When sending v1/reverse
+          | lat         | lon           | polygon_text | polygon_svg |
+          | 47.14122383 | 9.52169581334 | 1            | 1           |
+        Then a HTTP 400 is returned
+
+    Scenario Outline: Illegal jsonp are not allowed
+        When sending v1/reverse with format json
+          | lat         | lon           | json_callback |
+          | 47.14122383 | 9.52169581334 | <data> |
+        Then a HTTP 400 is returned
+
+        Examples:
+          | data |
+          | 1asd |
+          | bar(foo) |
+          | XXX['bad'] |
+          | foo; evil |
+
+    Scenario Outline: Reverse debug mode produces valid HTML
+        When sending v1/reverse
+          | lat   | lon   | debug |
+          | <lat> | <lon> | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid html
+
+        Examples:
+          | lat      | lon     |
+          | 0.0      | 0.0     |
+          | 47.06645 | 9.56601 |
+          | 47.14081 | 9.52267 |
+
+    Scenario Outline: Full address display for city housenumber-level address with street
+        When sending v1/reverse with format <format>
+          | lat        | lon        |
+          | 47.1068011 | 9.52810091 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And the result contains in field address
+          | param          | value     |
+          | house_number   | 8         |
+          | road           | Im Winkel |
+          | neighbourhood  | Oberdorf  |
+          | village        | Triesen   |
+          | ISO3166-2-lvl8 | LI-09     |
+          | county         | Oberland  |
+          | postcode       | 9495      |
+          | country        | Liechtenstein |
+          | country_code   | li        |
+
+        Examples:
+          | format  | outformat |
+          | json    | json |
+          | jsonv2  | json |
+          | xml     | xml |
+
+    Scenario Outline: Results with name details
+        When sending v1/reverse with format <format>
+          | lat      | lon     | zoom | namedetails |
+          | 47.14052 | 9.52202 | 14   | 1           |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And the result contains in field namedetails
+          | name     |
+          | Ebenholz |
+
+        Examples:
+          | format  | outformat |
+          | json    | json |
+          | jsonv2  | json |
+          | xml     | xml |
+
+    Scenario Outline: Results with extratags
+        When sending v1/reverse with format <format>
+          | lat      | lon     | zoom | extratags |
+          | 47.14052 | 9.52202 | 14   | 1         |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And the result contains in field extratags
+          | wikidata |
+          | Q4529531 |
+
+        Examples:
+          | format | outformat |
+          | json   | json |
+          | jsonv2 | json |
+          | xml    | xml |
diff --git a/test/bdd/features/api/reverse/v1_xml.feature b/test/bdd/features/api/reverse/v1_xml.feature
new file mode 100644
index 00000000..55cf0196
--- /dev/null
+++ b/test/bdd/features/api/reverse/v1_xml.feature
@@ -0,0 +1,116 @@
+Feature: XML output for Reverse API
+    Testing correctness of xml output (API version v1).
+
+    Scenario Outline: Reverse XML - Simple reverse-geocoding with no results
+        When sending v1/reverse
+          | lat   | lon   |
+          | <lat> | <lon> |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result has no attributes osm_type, address, extratags
+        And the result contains
+          | error |
+          | Unable to geocode |
+
+        Examples:
+         | lat      | lon |
+         | 0.0      | 0.0 |
+         | 91.3     | 0.4    |
+         | -700     | 0.4    |
+         | 0.2      | 324.44 |
+         | 0.2      | -180.4 |
+
+    Scenario Outline: Reverse XML - OSM result with and without addresses
+        When sending v1/reverse with format xml
+          | lat    | lon   | addressdetails |
+          | 47.066 | 9.504 | <has_address>  |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result has attributes place_id
+        And the result has <attributes> address
+        And the result contains
+          | osm_type | osm_id     | place_rank | address_rank |
+          | node     | 6522627624 | 30         | 30           |
+        And the result contains
+          | lon       | lat        | boundingbox |
+          | 9.5036065 | 47.0660892 | 47.0660392,47.0661392,9.5035565,9.5036565 |
+        And the result contains
+          | ref                   | display_name |
+          | Dorfbäckerei Herrmann | Dorfbäckerei Herrmann, 29, Gnetsch, Mäls, Balzers, Oberland, 9496, Liechtenstein |
+
+        Examples:
+          | has_address | attributes     |
+          | 1           | attributes     |
+          | 0           | no attributes |
+
+    Scenario: Reverse XML - Tiger address
+        When sending v1/reverse with format xml
+          | lat           | lon            |
+          | 32.4752389363 | -86.4810198619 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | osm_type | osm_id    | place_rank  | address_rank |
+          | way      | 396009653 | 30          | 30           |
+        And the result contains
+          | lon         | lat        | boundingbox |
+          | -86.4808553 | 32.4753580 | 32.4753080,32.4754080,-86.4809053,-86.4808053 |
+        And the result contains
+          | display_name |
+          | 707, Upper Kingston Road, Upper Kingston, Prattville, Autauga County, 36067, United States |
+
+    Scenario: Reverse XML - Interpolation address
+        When sending v1/reverse with format xml
+          | lat       | lon        |
+          | 47.118533 | 9.57056562 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | osm_type | osm_id | place_rank | address_rank |
+          | way      | 1      | 30         | 30           |
+        And the result contains
+          | lon       | lat        | boundingbox |
+          | 9.5705468 | 47.1185454 | 47.1184954,47.1185954,9.5704968,9.5705968 |
+        And the result contains
+          | display_name |
+          | 1019, Grosssteg, Sücka, Triesenberg, Oberland, 9497, Liechtenstein |
+
+    Scenario: Reverse XML - Output of geojson
+        When sending v1/reverse with format xml
+          | lat      | lon     | polygon_geojson |
+          | 47.06597 | 9.50467 | 1               |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geojson |
+          | {"type":"LineString","coordinates":[[9.5039353,47.0657546],[9.5040437,47.0657781],[9.5040808,47.065787],[9.5054298,47.0661407]]}  |
+
+    Scenario: Reverse XML - Output of WKT
+        When sending v1/reverse with format xml
+          | lat      | lon     | polygon_text |
+          | 47.06597 | 9.50467 | 1            |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geotext!wkt |
+          | 9.5039353 47.0657546, 9.5040437 47.0657781, 9.5040808 47.065787, 9.5054298 47.0661407 |
+
+    Scenario: Reverse XML - Output of SVG
+        When sending v1/reverse with format xml
+          | lat      | lon     | polygon_svg |
+          | 47.06597 | 9.50467 | 1           |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result contains
+          | geosvg |
+          | M 9.5039353 -47.0657546 L 9.5040437 -47.0657781 9.5040808 -47.065787 9.5054298 -47.0661407 |
+
+    Scenario: Reverse XML - Output of KML
+       When sending v1/reverse with format xml
+          | lat      | lon     | polygon_kml |
+          | 47.06597 | 9.50467 | 1           |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+       And the result contains
+          | geokml!fm |
+          | <geokml><LineString><coordinates>9.5039\d*,47.0657\d* 9.5040\d*,47.0657\d* 9.5040\d*,47.065\d* 9.5054\d*,47.0661\d*</coordinates></LineString></geokml> |
diff --git a/test/bdd/features/api/search/language.feature b/test/bdd/features/api/search/language.feature
new file mode 100644
index 00000000..ead4f88f
--- /dev/null
+++ b/test/bdd/features/api/search/language.feature
@@ -0,0 +1,83 @@
+Feature: Localization of search results
+
+    Scenario: Search - default language
+        When sending v1/search
+          | q |
+          | Liechtenstein |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liechtenstein |
+
+    Scenario: Search - accept-language first
+        When sending v1/search
+          | q             | accept-language |
+          | Liechtenstein | zh,de |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | 列支敦士登 |
+
+    Scenario: Search - accept-language missing
+        When sending v1/search
+          | q             | accept-language |
+          | Liechtenstein | xx,fr,en,de |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liechtenstein |
+
+    Scenario: Search - http accept language header first
+        Given the HTTP header
+          | accept-language |
+          | fo;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/search
+          | q |
+          | Liechtenstein |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liktinstein |
+
+    Scenario: Search - http accept language header and accept-language
+        Given the HTTP header
+          | accept-language |
+          | fr-ca,fr;q=0.8,en-ca;q=0.5,en;q=0.3 |
+        When sending v1/search
+          | q | accept-language |
+          | Liechtenstein | fo,en |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liktinstein |
+
+    Scenario: Search - http accept language header fallback
+        Given the HTTP header
+          | accept-language |
+          | fo-ca,en-ca;q=0.5 |
+        When sending v1/search
+          | q |
+          | Liechtenstein |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liktinstein |
+
+    Scenario: Search - http accept language header fallback (upper case)
+        Given the HTTP header
+          | accept-language |
+          | fo-FR;q=0.8,en-ca;q=0.5 |
+        When sending v1/search
+          | q |
+          | Liechtenstein |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And result 0 contains
+          | display_name |
+          | Liktinstein |
diff --git a/test/bdd/features/api/search/params.feature b/test/bdd/features/api/search/params.feature
new file mode 100644
index 00000000..d2f41f48
--- /dev/null
+++ b/test/bdd/features/api/search/params.feature
@@ -0,0 +1,361 @@
+Feature: Search queries
+    Testing different queries and parameters
+
+    Scenario: Simple XML search
+        When sending v1/search with format xml
+          | q |
+          | Schaan |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And all results have attributes place_id,osm_type,osm_id
+        And all results have attributes place_rank,boundingbox
+        And all results have attributes lat,lon,display_name
+        And all results have attributes class,type,importance
+        And all results have no attributes address
+        And all results contain
+          | boundingbox!in_box |
+          | 46.5,47.5,9,10 |
+
+    Scenario Outline: Simple JSON search
+        When sending v1/search with format <format>
+          | q |
+          | Vaduz |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And all results have attributes place_id,licence,<cname>,type
+        And all results have attributes osm_type,osm_id,boundingbox
+        And all results have attributes lat,lon,display_name,importance
+        And all results have no attributes address
+        And all results contain
+          | boundingbox!in_box |
+          | 46.5,47.5,9,10 |
+
+        Examples:
+          | format | cname    |
+          | json   | class    |
+          | jsonv2 | category |
+
+    Scenario: Unknown formats returns a user error
+        When sending v1/search with format x45
+          | q |
+          | Vaduz |
+        Then a HTTP 400 is returned
+
+    Scenario Outline: Search with addressdetails
+        When sending v1/search with format <format>
+          | q       | addressdetails |
+          | Triesen | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And result 0 contains in field address
+          | param        | value |
+          | village      | Triesen |
+          | county       | Oberland |
+          | postcode     | 9495 |
+          | country      | Liechtenstein |
+          | country_code | li |
+          | ISO3166-2-lvl8 | LI-09 |
+
+        Examples:
+          | format | outformat |
+          | json   | json |
+          | jsonv2 | json |
+          | geojson | geojson |
+          | xml    | xml |
+
+    Scenario: Coordinate search with addressdetails
+        When geocoding "47.12400621,9.6047552"
+          | accept-language |
+          | en |
+        Then all results contain
+          | display_name |
+          | Guschg, Valorschstrasse, Balzers, Oberland, 9497, Liechtenstein |
+
+    Scenario: Address details with unknown class types
+        When geocoding "Kloster St. Elisabeth"
+        Then result 0 contains
+          | category | type      | address+amenity |
+          | amenity  | monastery | Kloster St. Elisabeth |
+
+    Scenario: Disabling deduplication
+        When geocoding "Malbunstr, Schaan"
+        Then exactly 1 result is returned
+        When geocoding "Malbunstr, Schaan"
+          | dedupe |
+          | 0 |
+        Then exactly 4 results are returned
+
+    Scenario: Search with bounded viewbox in right area
+        When geocoding "post"
+          | bounded | viewbox |
+          | 1       |  9,47,10,48 |
+        Then result 0 contains
+          | address+town |
+          | Vaduz |
+        When geocoding "post"
+          | bounded | viewbox |
+          | 1       |  9.49712,47.17122,9.52605,47.16242 |
+        Then result 0 contains
+          | address+town |
+          | Schaan |
+
+    Scenario: Country search with bounded viewbox remain in the area
+        When geocoding
+          | bounded | viewbox                           | country |
+          | 1       | 9.49712,47.17122,9.52605,47.16242 | de |
+        Then exactly 0 results are returned
+
+    Scenario: Search with bounded viewboxlbrt in right area
+        When geocoding "bar"
+          | bounded | viewboxlbrt |
+          | 1       | 9.49712,47.16242,9.52605,47.17122 |
+        Then all results contain
+          | address+town |
+          | Schaan |
+
+    Scenario: No POI search with unbounded viewbox
+        When geocoding "restaurant"
+          | viewbox |
+          | 9.93027,53.61634,10.10073,53.54500 |
+        Then all results contain
+          | display_name!fm |
+          | .*[Rr]estaurant.* |
+
+    Scenario: bounded search remains within viewbox, even with no results
+         When geocoding "[restaurant]"
+           | bounded | viewbox |
+           | 1       | 43.5403125,-5.6563282,43.54285,-5.662003 |
+        Then exactly 0 results are returned
+
+    Scenario: bounded search remains within viewbox with results
+        When geocoding "restaurant"
+         | bounded | viewbox |
+         | 1       | 9.49712,47.17122,9.52605,47.16242 |
+        Then all results contain
+         | boundingbox!in_box |
+         | 47.16242,47.17122,9.49712,9.52605 |
+
+    Scenario: Prefer results within viewbox
+        When geocoding "Gässle"
+          | accept-language | viewbox |
+          | en              | 9.52413,47.10759,9.53140,47.10539 |
+        Then result 0 contains
+          | address+village |
+          | Triesen |
+        When geocoding "Gässle"
+          | accept-language | viewbox |
+          | en              | 9.45949,47.08421,9.54094,47.05466 |
+        Then result 0 contains
+          | address+town |
+          | Balzers |
+
+    Scenario: viewboxes cannot be points
+        When sending v1/search
+          | q   | viewbox |
+          | foo | 1.01,34.6,1.01,34.6 |
+        Then a HTTP 400 is returned
+
+    Scenario Outline: viewbox must have four coordinate numbers
+        When sending v1/search
+          | q   | viewbox |
+          | foo | <viewbox> |
+        Then a HTTP 400 is returned
+
+    Examples:
+        | viewbox |
+        | 34      |
+        | 0.003,-84.4 |
+        | 5.2,4.5542,12.4 |
+        | 23.1,-6,0.11,44.2,9.1 |
+
+    Scenario Outline: viewboxlbrt must have four coordinate numbers
+        When sending v1/search
+          | q   | viewboxlbrt |
+          | foo | <viewbox> |
+        Then a HTTP 400 is returned
+
+    Examples:
+        | viewbox |
+        | 34      |
+        | 0.003,-84.4 |
+        | 5.2,4.5542,12.4 |
+        | 23.1,-6,0.11,44.2,9.1 |
+
+    Scenario: Overly large limit number for search results
+        When geocoding "restaurant"
+          | limit |
+          | 1000 |
+        Then exactly 35 results are returned
+
+    Scenario: Limit number of non-duplicated search results
+        When geocoding "landstr"
+          | dedupe |
+          | 0      |
+        Then exactly 10 results are returned
+        When geocoding "landstr"
+          | limit | dedupe |
+          | 4     | 0      |
+        Then exactly 4 results are returned
+
+    Scenario: Limit parameter must be a number
+        When sending v1/search
+          | q           | limit |
+          | Blue Laguna | );    |
+        Then a HTTP 400 is returned
+
+    Scenario: Restrict to feature type country
+        When geocoding "fürstentum"
+          | featureType |
+          | country |
+        Then all results contain
+          | place_rank |
+          | 4 |
+
+    Scenario: Restrict to feature type state
+        When geocoding "Wangerberg"
+        Then more than 0 results are returned
+        When geocoding "Wangerberg"
+          | featureType |
+          | state |
+        Then exactly 0 results are returned
+
+    Scenario: Restrict to feature type city
+        When geocoding "vaduz"
+          | featureType |
+          | state |
+        Then exactly 0 results are returned
+        When geocoding "vaduz"
+          | featureType |
+          | city |
+        Then more than 0 results are returned
+        Then all results contain
+          | place_rank |
+          | 16 |
+
+    Scenario: Restrict to feature type settlement
+        When geocoding "Malbun"
+        Then result 1 contains
+          | category |
+          | landuse |
+        When geocoding "Malbun"
+          | featureType |
+          | settlement |
+        Then all results contain
+          | category | type |
+          | place    | village |
+
+    Scenario Outline: Search with polygon threshold (json)
+        When sending v1/search with format json
+          | q           | polygon_geojson | polygon_threshold |
+          | Triesenberg | 1               | <th> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And more than 0 results are returned
+        And all results have attributes geojson
+
+        Examples:
+          | th |
+          | -1 |
+          | 0.0 |
+          | 0.5 |
+          | 999 |
+
+    Scenario Outline: Search with polygon threshold (xml)
+        When sending v1/search with format xml
+          | q           | polygon_geojson | polygon_threshold |
+          | Triesenberg | 1               | <th> |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And more than 0 results are returned
+        And all results have attributes geojson
+
+        Examples:
+          | th |
+          | -1 |
+          | 0.0 |
+          | 0.5 |
+          | 999 |
+
+    Scenario Outline: Search with invalid polygon threshold (xml)
+        When sending v1/search with format xml
+          | q           | polygon_geojson | polygon_threshold |
+          | Triesenberg | 1               | <th> |
+        Then a HTTP 400 is returned
+
+        Examples:
+          | th |
+          | x |
+          | ;; |
+          | 1m |
+
+    Scenario Outline: Search with extratags
+        When sending v1/search with format <format>
+          | q       | extratags |
+          | Landstr | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And more than 0 results are returned
+        Then all results have attributes extratags
+
+        Examples:
+          | format | outformat |
+          | xml    | xml |
+          | json   | json |
+          | jsonv2 | json |
+          | geojson | geojson |
+
+    Scenario Outline: Search with namedetails
+        When sending v1/search with format <format>
+          | q       | namedetails |
+          | Landstr | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And more than 0 results are returned
+        Then all results have attributes namedetails
+
+        Examples:
+          | format | outformat |
+          | xml    | xml |
+          | json   | json |
+          | jsonv2 | json |
+          | geojson | geojson |
+
+    Scenario Outline: Search result with contains formatted geometry
+        When sending v1/search with format <format>
+          | q           | <param> |
+          | Triesenberg | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And more than 0 results are returned
+        And all results have attributes <response_attribute>
+
+        Examples:
+          | format   | outformat | param        | response_attribute |
+          | xml      | xml       | polygon_text | geotext |
+          | json     | json      | polygon_text | geotext |
+          | jsonv2   | json      | polygon_text | geotext |
+          | xml      | xml       |  polygon_svg | geosvg |
+          | json     | json      |  polygon_svg | svg |
+          | jsonv2   | json      |  polygon_svg | svg |
+          | xml      | xml       | polygon_kml  | geokml |
+          | json     | json      | polygon_kml  | geokml |
+          | jsonv2   | json      | polygon_kml  | geokml |
+          | xml      | xml       | polygon_geojson | geojson |
+          | json     | json      | polygon_geojson | geojson |
+          | jsonv2   | json      | polygon_geojson | geojson |
+          | geojson  | geojson   | polygon_geojson | geojson |
+
+    Scenario Outline: Search result in geojson format contains no non-geojson geometry
+        When sending v1/search with format geojson
+          | q           | <param> |
+          | Triesenberg | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid geojson
+        And more than 0 results are returned
+        And all results have no attributes <response_attribute>
+
+        Examples:
+          | param        | response_attribute |
+          | polygon_text | geotext            |
+          | polygon_svg  | svg                |
+          | polygon_kml  | geokml             |
diff --git a/test/bdd/api/search/postcode.feature b/test/bdd/features/api/search/postcode.feature
similarity index 58%
rename from test/bdd/api/search/postcode.feature
rename to test/bdd/features/api/search/postcode.feature
index bb1b755b..56242ec3 100644
--- a/test/bdd/api/search/postcode.feature
+++ b/test/bdd/features/api/search/postcode.feature
@@ -1,52 +1,51 @@
-@SQLITE
-@APIDB
 Feature: Searches with postcodes
     Various searches involving postcodes
 
-    @Fail
     Scenario: US 5+4 ZIP codes are shortened to 5 ZIP codes if not found
-        When sending json search query "36067 1111, us" with address
-        Then result addresses contain
+        When geocoding "36067-1111, us"
+        Then all results contain in field address
             | postcode |
             | 36067    |
-        And results contain
+        And all results contain
             | type     |
             | postcode |
 
     Scenario: Postcode search with address
-        When sending json search query "9486, mauren"
-        Then at least 1 result is returned
+        When geocoding "9486, mauren"
+        Then result 0 contains
+            | type     |
+            | postcode |
 
     Scenario: Postcode search with country
-        When sending json search query "9486, li" with address
-        Then result addresses contain
+        When geocoding "9486, li"
+        Then all results contain in field address
             | country_code |
             | li           |
 
     Scenario: Postcode search with country code restriction
-        When sending json search query "9490" with address
+        When geocoding "9490"
             | countrycodes |
             | li |
-        Then result addresses contain
+        Then all results contain in field address
             | country_code |
             | li           |
 
     Scenario: Postcode search with bounded viewbox restriction
-        When sending json search query "9486" with address
+        When geocoding "9486"
           | bounded | viewbox |
           | 1       | 9.55,47.20,9.58,47.22 |
-        Then result addresses contain
+        Then all results contain in field address
             | postcode |
             | 9486     |
-        When sending json search query "9486" with address
+        When geocoding "9486"
           | bounded | viewbox                 |
           | 1       | 5.00,20.00,6.00,21.00 |
-        Then exactly 0 results are returned
+        Then exactly 0 result is returned
 
     Scenario: Postcode search with structured query
-        When sending json search query "" with address
+        When geocoding ""
             | postalcode | country |
             | 9490       | li |
-        Then result addresses contain
+        Then all results contain in field address
             | country_code | postcode |
             | li           | 9490     |
diff --git a/test/bdd/features/api/search/queries.feature b/test/bdd/features/api/search/queries.feature
new file mode 100644
index 00000000..8453b53b
--- /dev/null
+++ b/test/bdd/features/api/search/queries.feature
@@ -0,0 +1,212 @@
+Feature: Search queries
+    Generic search result correctness
+
+    Scenario: Search for natural object
+        When geocoding "Samina"
+          | accept-language |
+          | en |
+        Then result 0 contains
+          | category | type  | display_name    |
+          | waterway | river | Samina, Austria |
+
+    Scenario: House number search for non-street address
+        When geocoding "6 Silum, Liechtenstein"
+          | accept-language |
+          | en |
+        Then result 0 contains in field address
+          | param        | value |
+          | house_number | 6 |
+          | village      | Silum |
+          | town         | Triesenberg |
+          | county       | Oberland |
+          | postcode     | 9497 |
+          | country      | Liechtenstein |
+          | country_code | li |
+          | ISO3166-2-lvl8  | LI-10 |
+
+    Scenario: Search for house number interpolation
+        When geocoding "Grosssteg 1023, Triesenberg"
+          | accept-language |
+          | de |
+        Then result 0 contains in field address
+          | param         | value |
+          | house_number  | 1023 |
+          | road          | Grosssteg |
+          | village       | Sücka |
+          | postcode      | 9497 |
+          | town          | Triesenberg |
+          | country       | Liechtenstein |
+          | country_code  | li |
+
+    Scenario: With missing housenumber search falls back to road
+        When geocoding "Bündaweg 555"
+        Then result 0 contains in field address
+          | param         | value |
+          | road          | Bündaweg |
+          | village       | Silum |
+          | postcode      | 9497 |
+          | county        | Oberland |
+          | town          | Triesenberg |
+          | country       | Liechtenstein |
+          | country_code  | li |
+          | ISO3166-2-lvl8  | LI-10 |
+        And all results have no attributes address+house_number
+
+    Scenario Outline: Housenumber 0 can be found
+        When sending v1/search with format <format>
+          | q              | addressdetails |
+          | Gnalpstrasse 0 | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And all results contain
+          | display_name!fm | address+house_number |
+          | 0,.*            | 0 |
+
+    Examples:
+        | format      | outformat |
+        | xml         | xml       |
+        | json        | json      |
+        | jsonv2      | json      |
+        | geojson     | geojson   |
+
+    Scenario: TIGER house number
+        When geocoding "697 Upper Kingston Road"
+        Then all results contain
+         | osm_type | display_name!fm | address+house_number |
+         | way      | 697,.*          | 697 |
+
+    Scenario: Search with class-type feature
+        When geocoding "bars in ebenholz"
+        Then all results contain
+          | place_rank |
+          | 30 |
+
+    Scenario: Search with specific amenity
+        When geocoding "[restaurant] Vaduz"
+        Then all results contain
+          | category | type       | address+country |
+          | amenity  | restaurant | Liechtenstein |
+
+    Scenario: Search with specific amenity also works in country
+        When geocoding "restaurants in liechtenstein"
+        Then all results contain
+          | category | type       | address+country |
+          | amenity  | restaurant | Liechtenstein |
+
+    Scenario: Search with key-value amenity
+        When geocoding "[club=scout] Vaduz"
+        Then all results contain
+          | category | type |
+          | club     | scout |
+
+    Scenario: POI search near given coordinate
+        When geocoding "restaurant near 47.16712,9.51100"
+        Then all results contain
+          | category | type |
+          | amenity  | restaurant |
+
+    Scenario: Arbitrary key/value search near given coordinate
+        When geocoding "[leisure=firepit]   47.150° N 9.5340493° E"
+        Then all results contain
+          | category | type |
+          | leisure  | firepit |
+
+    Scenario: POI search in a bounded viewbox
+        When geocoding "restaurants"
+          | viewbox                           | bounded |
+          | 9.50830,47.15253,9.52043,47.14866 | 1 |
+        Then all results contain
+          | category | type       |
+          | amenity  | restaurant |
+
+    Scenario Outline: Key/value search near given coordinate can be restricted to country
+        When geocoding "[natural=peak] 47.06512,9.53965"
+          | countrycodes |
+          | <cc> |
+        Then all results contain
+          | address+country_code |
+          | <cc> |
+
+        Examples:
+            | cc |
+            | li |
+            | ch |
+
+    Scenario: Name search near given coordinate
+        When geocoding "sporry"
+        Then result 0 contains
+          | address+town |
+          | Vaduz |
+        When geocoding "sporry, 47.10791,9.52676"
+        Then result 0 contains
+          | address+village |
+          | Triesen |
+
+    Scenario: Name search near given coordinate without result
+        When geocoding "sporry, N 47 15 7 W 9 61 26"
+        Then exactly 0 results are returned
+
+    Scenario: Arbitrary key/value search near a road
+        When geocoding "[amenity=drinking_water] Wissfläckaweg"
+        Then all results contain
+          | category | type |
+          | amenity  | drinking_water |
+
+    Scenario: Ignore other country codes in structured search with country
+        When geocoding
+            | countrycodes | country |
+            | li           | de      |
+        Then exactly 0 results are returned
+
+    Scenario: Ignore country searches when query is restricted to countries
+        When geocoding "fr"
+        Then all results contain
+            | name |
+            | France |
+        When geocoding "fr"
+            | countrycodes |
+            | li  |
+        Then exactly 0 results are returned
+
+    Scenario: Country searches only return results for the given country
+        When geocoding "Ans Trail"
+            | countrycodes |
+            | li |
+        Then all results contain
+            | address+country_code |
+            | li |
+
+    # https://trac.openstreetmap.org/ticket/5094
+    Scenario: housenumbers are ordered by complete match first
+        When geocoding "Austrasse 11, Vaduz"
+        Then result 0 contains
+          | address+house_number |
+          | 11 |
+
+    Scenario Outline: Coordinate searches with white spaces
+        When geocoding "<data>"
+        Then the result set contains exactly
+          | category |
+          | water    |
+
+        Examples:
+          | data |
+          | sporry weiher, N 47.10791° E 9.52676° |
+          | sporry weiher,	N 47.10791° E 9.52676° |
+          | 	sporry weiher	, 	N 47.10791° E 9.52676° |
+          | sporry weiher, N 47.10791° 		E 9.52676° |
+          | sporry weiher, N 47.10791° E	9.52676° |
+
+    Scenario: Searches with white spaces
+        When geocoding "52	Bodastr,Triesenberg"
+        Then all results contain
+          | category | type |
+          | highway  | residential |
+
+
+    # github #1949
+    Scenario: Addressdetails always return the place type
+       When geocoding "Vaduz"
+       Then result 0 contains
+         | address+town |
+         | Vaduz |
diff --git a/test/bdd/features/api/search/simple.feature b/test/bdd/features/api/search/simple.feature
new file mode 100644
index 00000000..3dc76922
--- /dev/null
+++ b/test/bdd/features/api/search/simple.feature
@@ -0,0 +1,166 @@
+Feature: Simple Tests
+    Simple tests for internal server errors and response format.
+
+    Scenario Outline: Garbage Searches
+        When sending v1/search
+          | q |
+          | <query> |
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And exactly 0 results are returned
+
+    Examples:
+     | query |
+     | New York, New York |
+     | 12, Main Street, Houston |
+     | München |
+     | 東京都 |
+     | hotels in sdfewf |
+     | xywxkrf |
+     | gh; foo() |
+     | %#$@*&l;der#$! |
+     | 234.23.14.5 |
+     | aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus aussenstelle universitat lichtenstein wachterhaus |
+
+    Scenario: Empty XML search
+        When sending v1/search with format xml
+          | q        |
+          | xnznxvcx |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        Then the result metadata contains
+          | param       | value |
+          | querystring | xnznxvcx |
+          | more_url!fm | .*q=xnznxvcx.*format=xml |
+
+    Scenario: Empty XML search with special XML characters
+        When sending v1/search with format xml
+          | q |
+          | xfdghn&zxn"xvbyx<vxx>cssdex |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        Then the result metadata contains
+          | param       | value |
+          | querystring | xfdghn&zxn"xvbyx<vxx>cssdex |
+          | more_url!fm | .*q=xfdghn%26zxn%22xvbyx%3Cvxx%3Ecssdex.*format=xml |
+
+    Scenario: Empty XML search with viewbox
+        When sending v1/search with format xml
+          | q        | viewbox |
+          | xnznxvcx | 12,33,77,45.13 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | param        | value |
+          | querystring | xnznxvcx |
+          | viewbox     | 12,33,77,45.13 |
+
+    Scenario: Empty XML search with viewboxlbrt
+        When sending v1/search with format xml
+          | q        | viewboxlbrt |
+          | xnznxvcx | 12,34.13,77,45 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | param       | value |
+          | querystring | xnznxvcx |
+          | viewbox     | 12,34.13,77,45 |
+
+    Scenario: Empty XML search with viewboxlbrt and viewbox
+        When sending v1/search with format xml
+          | q   | viewbox        | viewboxlbrt |
+          | pub | 12,33,77,45.13 | 1,2,3,4 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | param       | value |
+          | querystring | pub |
+          | viewbox     | 12,33,77,45.13 |
+
+    Scenario: Empty XML search with excluded place ids
+        When sending v1/search with format xml
+          | q              | exclude_place_ids |
+          | jghrleoxsbwjer | 123,76,342565 |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | param             | value |
+          | exclude_place_ids | 123,76,342565 |
+
+    Scenario: Empty XML search with bad excluded place ids
+        When sending v1/search with format xml
+          | q              | exclude_place_ids |
+          | jghrleoxsbwjer | , |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata has no attributes exclude_place_ids
+
+    Scenario Outline: Wrapping of illegal jsonp search requests
+        When sending v1/search with format json
+          | q     | json_callback |
+          | Tokyo | <data> |
+        Then a HTTP 400 is returned
+        And the result is valid json
+        And the result contains
+          | error+code | error+message |
+          | 400        | Invalid json_callback value |
+
+        Examples:
+          | data |
+          | 1asd |
+          | bar(foo) |
+          | XXX['bad'] |
+          | foo; evil |
+          | 234 |
+
+    Scenario: Ignore jsonp parameter for anything but json
+        When sending v1/search with format xml
+          | q     | json_callback |
+          | Tokyo | 234 |
+        Then a HTTP 200 is returned
+        Then the result is valid xml
+
+    Scenario Outline: Empty search for json like
+        When sending v1/search with format <format>
+          | q |
+          | YHlERzzx |
+        Then a HTTP 200 is returned
+        And the result is valid <outformat>
+        And exactly 0 results are returned
+
+        Examples:
+          | format | outformat |
+          | json   | json |
+          | jsonv2 | json |
+          | geojson | geojson |
+          | geocodejson | geocodejson |
+
+    Scenario: Search for non-existing coordinates
+        When geocoding "-21.0,-33.0"
+        Then exactly 0 results are returned
+
+    Scenario: Country code selection is retained in more URL (#596)
+        When sending v1/search with format xml
+          | q     | countrycodes |
+          | Vaduz | pl,1,,invalid,undefined,%3Cb%3E,bo,, |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | more_url!fm |
+          | .*&countrycodes=pl%2Cbo&.* |
+
+    Scenario Outline: Search debug output does not return errors
+        When sending v1/search
+          | q       | debug |
+          | <query> | 1     |
+        Then a HTTP 200 is returned
+        And the result is valid html
+
+        Examples:
+          | query |
+          | Liechtenstein |
+          | Triesen |
+          | Pfarrkirche |
+          | Landstr 27 Steinort, Triesenberg, 9495 |
+          | 9497 |
+          | restaurant in triesen |
diff --git a/test/bdd/features/api/search/structured.feature b/test/bdd/features/api/search/structured.feature
new file mode 100644
index 00000000..60f0f309
--- /dev/null
+++ b/test/bdd/features/api/search/structured.feature
@@ -0,0 +1,72 @@
+Feature: Structured search queries
+    Testing correctness of results with
+    structured queries
+
+    Scenario: Structured search for country only
+        When geocoding
+          | country |
+          | Liechtenstein |
+        Then all results contain in field address
+          | country_code | country       |
+          | li           | Liechtenstein |
+
+    Scenario: Structured search for postcode only
+        When geocoding
+          | postalcode |
+          | 9495 |
+        Then all results contain
+          | type!fm         | address+postcode |
+          | ^post(al_)?code | 9495             |
+
+    Scenario: Structured search for street, postcode and country
+        When sending v1/search with format xml
+          | street          | postalcode | country        |
+          | Old Palace Road | GU2 7UP    | United Kingdom |
+        Then a HTTP 200 is returned
+        And the result is valid xml
+        And the result metadata contains
+          | querystring |
+          | Old Palace Road, GU2 7UP, United Kingdom |
+
+    Scenario: Structured search for street with housenumber, city and postcode
+        When geocoding
+          | street             | city  | postalcode |
+          | 19 Am schrägen Weg | Vaduz | 9490       |
+        Then all results contain in field address
+          | house_number | road |
+          | 19           | Am Schrägen Weg |
+
+    Scenario: Structured search for street with housenumber, city and bad postcode
+        When geocoding
+          | street             | city  | postalcode |
+          | 19 Am schrägen Weg | Vaduz | 9491       |
+        Then all results contain in field address
+          | house_number | road |
+          | 19           | Am Schrägen Weg |
+
+    Scenario: Structured search for amenity, city
+        When geocoding
+          | city  | amenity |
+          | Vaduz | bar  |
+        Then all results contain
+          | address+country | category | type!fm |
+          | Liechtenstein   | amenity  | (pub)\|(bar)\|(restaurant) |
+
+    #176
+    Scenario: Structured search restricts rank
+        When geocoding
+          | city |
+          | Steg |
+        Then all results contain
+          | addresstype |
+          | village |
+
+    #3651
+    Scenario: Structured search with surrounding extra characters
+        When geocoding
+          | street               | city  | postalcode |
+          | "19 Am schrägen Weg" | "Vaduz" | "9491"  |
+        Then all results contain in field address
+          | house_number | road |
+          | 19           | Am Schrägen Weg |
+
diff --git a/test/bdd/features/api/search/v1_geocodejson.feature b/test/bdd/features/api/search/v1_geocodejson.feature
new file mode 100644
index 00000000..99fff0e4
--- /dev/null
+++ b/test/bdd/features/api/search/v1_geocodejson.feature
@@ -0,0 +1,42 @@
+Feature: Search API geocodejson output
+    Testing correctness of geocodejson output.
+
+    Scenario: Search geocodejson - City housenumber-level address with street
+        When sending v1/search with format geocodejson
+          | q                    | addressdetails |
+          | Im Winkel 8, Triesen | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson
+        And all results contain
+          | housenumber | street    | postcode | city    | country |
+          | 8           | Im Winkel | 9495     | Triesen | Liechtenstein |
+
+    Scenario: Search geocodejson - Town street-level address with street
+        When sending v1/search with format geocodejson
+          | q                | addressdetails |
+          | Gnetsch, Balzers | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson
+        And all results contain
+          | name    | city    | postcode | country |
+          | Gnetsch | Balzers | 9496     | Liechtenstein |
+
+    Scenario: Search geocodejson - Town street-level address with footway
+        When sending v1/search with format geocodejson
+          | q                                    | addressdetails |
+          | burg gutenberg 6000 jahre geschichte | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson
+        And all results contain
+          | street  | city    | postcode | country |
+          | Burgweg | Balzers | 9496     | Liechtenstein |
+
+    Scenario: Search geocodejson - City address with suburb
+        When sending v1/search with format geocodejson
+          | q                           | addressdetails |
+          | Lochgass 5, Ebenholz, Vaduz | 1 |
+        Then a HTTP 200 is returned
+        And the result is valid geocodejson
+        And all results contain
+          | housenumber | street   | district | city  | postcode | country |
+          | 5           | Lochgass | Ebenholz | Vaduz | 9490     | Liechtenstein |
diff --git a/test/bdd/features/api/status/failures.feature b/test/bdd/features/api/status/failures.feature
new file mode 100644
index 00000000..b66bf324
--- /dev/null
+++ b/test/bdd/features/api/status/failures.feature
@@ -0,0 +1,19 @@
+Feature: Status queries against unknown database
+    Testing status query
+
+    Background:
+        Given an unknown database
+
+    Scenario: Failed status as text
+        When sending v1/status
+        Then a HTTP 500 is returned
+        And the page content equals "ERROR: Database connection failed"
+
+    Scenario: Failed status as json
+        When sending v1/status with format json
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | status!:d | message |
+          | 700       | Database connection failed |
+        And the result has no attributes data_updated
diff --git a/test/bdd/features/api/status/simple.feature b/test/bdd/features/api/status/simple.feature
new file mode 100644
index 00000000..23ba0934
--- /dev/null
+++ b/test/bdd/features/api/status/simple.feature
@@ -0,0 +1,15 @@
+Feature: Status queries
+    Testing status query
+
+    Scenario: Status as text
+        When sending v1/status
+        Then a HTTP 200 is returned
+        And the page content equals "OK"
+
+    Scenario: Status as json
+        When sending v1/status with format json
+        Then a HTTP 200 is returned
+        And the result is valid json
+        And the result contains
+          | status!:d | message | data_updated!fm |
+          | 0         | OK      | ....-..-..T..:..:...00:00 |
diff --git a/test/bdd/db/import/addressing.feature b/test/bdd/features/db/import/addressing.feature
similarity index 84%
rename from test/bdd/db/import/addressing.feature
rename to test/bdd/features/db/import/addressing.feature
index e7c91207..e61a4777 100644
--- a/test/bdd/db/import/addressing.feature
+++ b/test/bdd/features/db/import/addressing.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Address computation
     Tests for filling of place_addressline
 
@@ -11,16 +10,13 @@ Feature: Address computation
             | N2  | place | hamlet   | West Farm | 2 |
             | N3  | place | hamlet   | East Farm | 3 |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
             | object | address | fromarea |
             | N1     | N3      | False |
-        Then place_addressline doesn't contain
-            | object | address |
-            | N1     | N2      |
-        When sending search query "Square"
-        Then results contain
-           | osm | display_name      |
-           | N1  | Square, East Farm |
+        When geocoding "Square"
+        Then the result set contains
+           | object | display_name      |
+           | N1     | Square, East Farm |
 
     Scenario: given two place nodes, the closer one wins for the address
         Given the grid
@@ -102,12 +98,9 @@ Feature: Address computation
             | N2  | place    | city    | 15    | 9 |
             | R1  | place    | city    | 8     | (1,2,3,4,1) |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
             | object | address | isaddress | cached_rank_address |
             | N1     | R1      | True      | 16                  |
-        And place_addressline doesn't contain
-            | object | address |
-            | N1     | N2      |
 
 
     Scenario: place nodes close enough to smaller ranked place nodes are included
@@ -191,12 +184,9 @@ Feature: Address computation
             | W10 | boundary | administrative | 5     | (1, 2, 8, 5, 4, 1) |
             | W11 | boundary | administrative | 5     | (2, 3, 6, 5, 8, 2) |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
             | object | address | cached_rank_address |
             | W1     | W10     | 10                  |
-        Then place_addressline doesn't contain
-            | object | address |
-            | W1     | W11     |
 
     Scenario: Roads should not contain boundaries they touch in a middle point
         Given the grid
@@ -211,12 +201,9 @@ Feature: Address computation
             | W10 | boundary | administrative | 5     | (1, 2, 8, 5, 4, 1) |
             | W11 | boundary | administrative | 5     | (2, 3, 6, 5, 8, 2) |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
             | object | address | cached_rank_address |
             | W1     | W10     | 10                  |
-        Then place_addressline doesn't contain
-            | object | address |
-            | W1     | W11     |
 
     Scenario: Locality points should contain all boundaries they touch
         Given the 0.001 grid
@@ -248,9 +235,8 @@ Feature: Address computation
             | osm | class    | type           | admin | geometry      |
             | W10 | boundary | administrative | 5     | (2, 3, 6, 5, 2) |
         When importing
-        Then place_addressline doesn't contain
+        Then place_addressline contains exactly
             | object | address |
-            | W1     | W10     |
 
     Scenario: buildings with only addr:postcodes do not appear in the address of a way
         Given the grid with origin DE
@@ -273,9 +259,14 @@ Feature: Address computation
             | osm | class    | type        | addr+postcode | geometry |
             | W22 | place    | postcode    | 11234         | (10,11,12,13,10) |
         When importing
-        Then place_addressline doesn't contain
+        Then place_addressline contains exactly
             | object | address  |
-            | W93    | W22      |
+            | R4     | R1       |
+            | R4     | R34      |
+            | R34    | R1       |
+            | W93    | R1       |
+            | W93    | R34      |
+            | W93    | R4       |
 
     Scenario: postcode boundaries do appear in the address of a way
        Given the grid with origin DE
@@ -314,9 +305,8 @@ Feature: Address computation
             | W1  | highway  | residential    | 8, 9     |
             | W2  | place    | square         | (1, 2, 3 ,4, 1) |
         When importing
-        Then place_addressline doesn't contain
+        Then place_addressline contains exactly
             | object | address |
-            | W1     | W2      |
 
     Scenario: addr:* tags are honored even when a street is far away from the place
         Given the grid
@@ -332,14 +322,11 @@ Feature: Address computation
             | W1  | highway | primary | Left      | 8,9      |
             | W2  | highway | primary | Right     | 8,9      |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | True      |
            | W1     | R2      | False     |
            | W2     | R2      | True      |
-        And place_addressline doesn't contain
-           | object | address |
-           | W2     | R1      |
 
 
     Scenario: addr:* tags are honored even when a POI is far away from the place
@@ -356,17 +343,14 @@ Feature: Address computation
             | W1  | highway | primary | Wonderway | Right     | 8,9      |
             | N1  | amenity | cafe    | Bolder    | Left      | 9        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R2      | True      |
            | N1     | R1      | True      |
-        And place_addressline doesn't contain
-           | object | address |
-           | W1     | R1      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name            |
-           | N1  | Bolder, Wonderway, Left |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name            |
+           | N1     | Bolder, Wonderway, Left |
 
     Scenario: addr:* tags do not produce addresslines when the parent has the address part
         Given the grid
@@ -381,16 +365,13 @@ Feature: Address computation
             | W1  | highway | primary | Wonderway | Outer     | 8,9      |
             | N1  | amenity | cafe    | Bolder    | Outer     | 9        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | True      |
-        And place_addressline doesn't contain
-           | object | address |
-           | N1     | R1      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name             |
-           | N1  | Bolder, Wonderway, Outer |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name             |
+           | N1     | Bolder, Wonderway, Outer |
 
     Scenario: addr:* tags on outside do not produce addresslines when the parent has the address part
         Given the grid
@@ -406,17 +387,14 @@ Feature: Address computation
             | W1  | highway | primary | Wonderway | Left      | 8,9      |
             | N1  | amenity | cafe    | Bolder    | Left      | 9        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | True      |
            | W1     | R2      | False     |
-        And place_addressline doesn't contain
-           | object | address |
-           | N1     | R1      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name            |
-           | N1  | Bolder, Wonderway, Left |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name            |
+           | N1     | Bolder, Wonderway, Left |
 
     Scenario: POIs can correct address parts on the fly
         Given the grid
@@ -433,22 +411,18 @@ Feature: Address computation
             | N1  | amenity | cafe    | Bolder    | 9        |
             | N2  | amenity | cafe    | Leftside  | 8        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | False     |
            | W1     | R2      | True      |
-        And place_addressline doesn't contain
-           | object | address |
-           | N1     | R1      |
-           | N2     | R2      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name            |
-           | N1  | Bolder, Wonderway, Left |
-        When sending search query "Leftside"
-        Then results contain
-           | osm | display_name               |
-           | N2  | Leftside, Wonderway, Right |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name            |
+           | N1     | Bolder, Wonderway, Left |
+        When geocoding "Leftside"
+        Then the result set contains
+           | object | display_name               |
+           | N2     | Leftside, Wonderway, Right |
 
 
     Scenario: POIs can correct address parts on the fly (with partial unmatching address)
@@ -469,22 +443,18 @@ Feature: Address computation
             | N1  | amenity | cafe    | Bolder    | Boring      | 9        |
             | N2  | amenity | cafe    | Leftside  | Boring      | 8        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | True      |
            | W1     | R2      | False     |
-        And place_addressline doesn't contain
-           | object | address |
-           | N1     | R1      |
-           | N2     | R2      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name            |
-           | N1  | Bolder, Wonderway, Left |
-        When sending search query "Leftside"
-        Then results contain
-           | osm | display_name               |
-           | N2  | Leftside, Wonderway, Right |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name            |
+           | N1     | Bolder, Wonderway, Left |
+        When geocoding "Leftside"
+        Then the result set contains
+           | object | display_name               |
+           | N2     | Leftside, Wonderway, Right |
 
 
 
@@ -506,30 +476,26 @@ Feature: Address computation
             | N1  | amenity | cafe    | Bolder    | Left       | 9        |
             | N2  | amenity | cafe    | Leftside  | Left       | 8        |
         When importing
-        Then place_addressline contains
+        Then place_addressline contains exactly
            | object | address | isaddress |
            | W1     | R1      | True      |
            | W1     | R2      | False     |
-        And place_addressline doesn't contain
-           | object | address |
-           | N1     | R1      |
-           | N2     | R2      |
-        When sending search query "Bolder"
-        Then results contain
-           | osm | display_name            |
-           | N1  | Bolder, Wonderway, Left |
-        When sending search query "Leftside"
-        Then results contain
-           | osm | display_name               |
-           | N2  | Leftside, Wonderway, Left |
+        When geocoding "Bolder"
+        Then the result set contains
+           | object | display_name            |
+           | N1     | Bolder, Wonderway, Left |
+        When geocoding "Leftside"
+        Then the result set contains
+           | object | display_name               |
+           | N2     | Leftside, Wonderway, Left |
 
 
     Scenario: addr:* tags always match the closer area
         Given the grid
             | 1 |   |   |   |  2 |   | 5 |
             |   |   |   |   |    |   |   |
-            |   | 10| 11|   |    |   |   |
             | 4 |   |   |   |  3 |   | 6 |
+            |   | 10| 11|   |    |   |   |
         And the places
             | osm | class    | type           | admin | name  | geometry    |
             | R1  | boundary | administrative | 8     | Left  | (1,2,3,4,1) |
@@ -538,9 +504,9 @@ Feature: Address computation
             | osm | class   | type    | name      | addr+city | geometry |
             | W1  | highway | primary | Wonderway | Left      | 10,11    |
         When importing
-        Then place_addressline doesn't contain
+        Then place_addressline contains exactly
             | object | address |
-            | W1     | R2      |
+            | W1     | R1      |
 
     Scenario: Full name is prefered for unlisted addr:place tags
         Given the grid
@@ -559,7 +525,7 @@ Feature: Address computation
             | osm | class | type  | housenr | addr+street   | geometry |
             | N2  | place | house | 2       | Royal Terrace | 2        |
         When importing
-        When sending search query "1, Royal Terrace Gardens"
-        Then results contain
-            | ID | osm |
-            | 0  | N1  |
+        When geocoding "1, Royal Terrace Gardens"
+        Then result 0 contains
+            | object |
+            | N1  |
diff --git a/test/bdd/db/import/country.feature b/test/bdd/features/db/import/country.feature
similarity index 84%
rename from test/bdd/db/import/country.feature
rename to test/bdd/features/db/import/country.feature
index bfa46969..90f40d05 100644
--- a/test/bdd/db/import/country.feature
+++ b/test/bdd/features/db/import/country.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Country handling
     Tests for import and use of country information
 
@@ -10,16 +9,16 @@ Feature: Country handling
             | osm  | class    | type          | name  | geometry   |
             | N1   | place    | town          | Wenig | country:de |
         When importing
-        When sending search query "Wenig, Loudou"
-        Then results contain
-            | osm | display_name |
-            | N1  | Wenig, Deutschland |
-        When sending search query "Wenig"
+        When geocoding "Wenig, Loudou"
+        Then the result set contains
+            | object | display_name |
+            | N1     | Wenig, Deutschland |
+        When geocoding "Wenig"
             | accept-language |
             | xy,en |
-        Then results contain
-            | osm | display_name |
-            | N1  | Wenig, Loudou |
+        Then the result set contains
+            | object | display_name |
+            | N1     | Wenig, Loudou |
 
     Scenario: OSM country relations outside expected boundaries are ignored for naming
         Given the grid
@@ -32,12 +31,12 @@ Feature: Country handling
             | osm  | class    | type          | name  | geometry   |
             | N1   | place    | town          | Wenig | country:de |
         When importing
-        When sending search query "Wenig"
+        When geocoding "Wenig"
             | accept-language |
             | xy,en |
-        Then results contain
-            | osm | display_name |
-            | N1  | Wenig, Germany |
+        Then the result set contains
+            | object | display_name |
+            | N1     | Wenig, Germany |
 
     Scenario: Pre-defined country names are used
         Given the grid with origin CH
@@ -46,12 +45,12 @@ Feature: Country handling
             | osm  | class    | type          | name  | geometry   |
             | N1   | place    | town          | Ingb  | 1          |
         When importing
-        And sending search query "Ingb"
+        And geocoding "Ingb"
             | accept-language |
             | en,de |
-        Then results contain
-            | osm | display_name |
-            | N1  | Ingb, Switzerland |
+        Then the result set contains
+            | object | display_name |
+            | N1     | Ingb, Switzerland |
 
     Scenario: For overlapping countries, pre-defined countries are tie-breakers
         Given the grid with origin US
diff --git a/test/bdd/db/import/interpolation.feature b/test/bdd/features/db/import/interpolation.feature
similarity index 96%
rename from test/bdd/db/import/interpolation.feature
rename to test/bdd/features/db/import/interpolation.feature
index 6b784b78..b1f31f8f 100644
--- a/test/bdd/db/import/interpolation.feature
+++ b/test/bdd/features/db/import/interpolation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import of address interpolations
     Tests that interpolated addresses are added correctly
 
@@ -60,7 +59,7 @@ Feature: Import of address interpolations
         When importing
         Then W1 expands to interpolation
           | start | end | geometry |
-          | 4     | 6   | 9,8      |
+          | 4     | 6   | 8,9      |
 
     Scenario: Simple odd two point interpolation
         Given the grid with origin 1,1
@@ -227,8 +226,8 @@ Feature: Import of address interpolations
 
     Scenario: Even three point interpolation line with odd center point
         Given the grid
-          | 1 |  | 10 |  |  | 11 | 3 | 2 |
-          | 4 |  |    |  |  |    |   | 5 |
+          | 1 |  | 10 |  | 11 | 3 | 2 |
+          | 4 |  |    |  |    |   | 5 |
         Given the places
           | osm | class | type  | housenr |
           | N1  | place | house | 2       |
@@ -332,14 +331,14 @@ Feature: Import of address interpolations
         Then W11 expands to interpolation
           | parent_place_id | start | end |
           | W3              | 14    | 14 |
-        When sending search query "16 Cloud Street"
-        Then results contain
-         | ID | osm |
-         | 0  | N4  |
-        When sending search query "14 Cloud Street"
-        Then results contain
-         | ID | osm |
-         | 0  | W11 |
+        When geocoding "16 Cloud Street"
+        Then result 0 contains
+         | object |
+         | N4  |
+        When geocoding "14 Cloud Street"
+        Then result 0 contains
+         | object |
+         | W11 |
 
     Scenario: addr:street on housenumber way
         Given the grid
@@ -377,14 +376,14 @@ Feature: Import of address interpolations
         Then W11 expands to interpolation
           | parent_place_id | start | end |
           | W3              | 14    | 14 |
-        When sending search query "16 Cloud Street"
-        Then results contain
-         | ID | osm |
-         | 0  | N4  |
-        When sending search query "14 Cloud Street"
-        Then results contain
-         | ID | osm |
-         | 0  | W11 |
+        When geocoding "16 Cloud Street"
+        Then result 0 contains
+         | object |
+         | N4  |
+        When geocoding "14 Cloud Street"
+        Then result 0 contains
+         | object |
+         | W11 |
 
     Scenario: Geometry of points and way don't match (github #253)
         Given the places
@@ -404,7 +403,7 @@ Feature: Import of address interpolations
         When importing
         Then W1 expands to interpolation
           | start | end | geometry |
-          | 4     | 4   | 144.963016 -37.762946 |
+          | 4     | 4   | 144.96301672 -37.76294644 |
           | 8     | 8   | 144.96314407 -37.762223692 |
 
     Scenario: Place with missing address information
@@ -428,7 +427,7 @@ Feature: Import of address interpolations
         When importing
         Then W1 expands to interpolation
           | start | end | geometry |
-          | 25    | 27  | 0.000016 0,0.00002 0,0.000033 0 |
+          | 25    | 27  | 0.0000166 0,0.00002 0,0.0000333 0 |
 
     Scenario: Ways without node entries are ignored
         Given the places
@@ -478,10 +477,10 @@ Feature: Import of address interpolations
         Then W1 expands to interpolation
           | start | end | geometry |
           | 2     | 8   | 10,11 |
-        When sending v1/reverse at 1,1
-        Then results contain
-          | ID | osm | type  | display_name |
-          | 0  | N1  | house | 0, London Road |
+        When reverse geocoding 1,1
+        Then the result contains
+          | object | type  | display_name |
+          | N1     | house | 0, London Road |
 
     Scenario: Parenting of interpolation with additional tags
         Given the grid
diff --git a/test/bdd/db/import/linking.feature b/test/bdd/features/db/import/linking.feature
similarity index 85%
rename from test/bdd/db/import/linking.feature
rename to test/bdd/features/db/import/linking.feature
index 5bfdbca7..22d5d48e 100644
--- a/test/bdd/db/import/linking.feature
+++ b/test/bdd/features/db/import/linking.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Linking of places
     Tests for correctly determining linked places
 
@@ -53,10 +52,10 @@ Feature: Linking of places
          | W2     | R13 |
          | R13    | -   |
          | R23    | -   |
-        When sending search query "rhein"
-        Then results contain
-         | osm |
-         | R13 |
+        When geocoding "rhein"
+        Then the result set contains
+         | object |
+         | R13    |
 
     Scenario: Relations are not linked when in waterway relations
         Given the grid
@@ -79,11 +78,13 @@ Feature: Linking of places
          | W2     | - |
          | R1     | - |
          | R2     | - |
-        When sending search query "rhein"
-        Then results contain
-          | ID | osm |
-          |  0 | R1  |
-          |  1 | W2  |
+        When geocoding "rhein"
+        Then result 0 contains
+          | object |
+          | R1  |
+        And result 1 contains
+          | object |
+          | W2  |
 
 
     Scenario: Empty waterway relations are handled correctly
@@ -136,9 +137,9 @@ Feature: Linking of places
          | object | linked_place_id |
          | W1     | -  |
          | W2     | R1 |
-        When sending search query "rhein2"
-        Then results contain
-         | osm |
+        When geocoding "rhein2"
+        Then the result set contains
+         | object |
          | W1  |
 
     # github #573
@@ -180,8 +181,8 @@ Feature: Linking of places
          | object  | linked_place_id |
          | N2      | R13 |
         And placex contains
-         | object | centroid | name+name | extratags+linked_place |
-         | R13    | 9        | Garbo     | hamlet |
+         | object | centroid!wkt | name+name | extratags+linked_place |
+         | R13    | 9            | Garbo     | hamlet |
 
     Scenario: Boundaries with place tags are linked against places with same type
         Given the 0.01 grid
@@ -201,18 +202,18 @@ Feature: Linking of places
         And placex contains
          | object | rank_address |
          | R13    | 16 |
-        When sending search query ""
+        When geocoding ""
          | city |
          | Berlin |
-        Then results contain
-          | ID | osm |
-          |  0 | R13 |
-        When sending search query ""
+        Then result 0 contains
+          | object |
+          | R13 |
+        When geocoding ""
          | state |
          | Berlin |
-        Then results contain
-          | ID | osm |
-          |  0 | R13 |
+        Then result 0 contains
+          | object |
+          | R13 |
 
 
     Scenario: Boundaries without place tags only link against same admin level
@@ -233,18 +234,18 @@ Feature: Linking of places
         And placex contains
          | object | rank_address |
          | R13    | 8 |
-        When sending search query ""
+        When geocoding ""
          | state |
          | Berlin |
-        Then results contain
-          | ID | osm |
-          |  0 | R13 |
-        When sending search query ""
+        Then result 0 contains
+          | object |
+          | R13 |
+        When geocoding ""
          | city |
          | Berlin |
-        Then results contain
-          | ID | osm |
-          |  0 | N2  |
+        Then result 0 contains
+          | object |
+          | N2  |
 
     # github #1352
     Scenario: Do not use linked centroid when it is outside the area
@@ -266,8 +267,8 @@ Feature: Linking of places
          | object | linked_place_id |
          | N2     | R13             |
         And placex contains
-         | object | centroid |
-         | R13    | in geometry  |
+         | object | centroid!in_box |
+         | R13    | 0,0,0.1,0.1      |
 
     Scenario: Place nodes can only be linked once
         Given the 0.02 grid
@@ -286,7 +287,7 @@ Feature: Linking of places
          | object | linked_place_id |
          | N2     | R1              |
         And placex contains
-         | object | extratags                |
+         | object | extratags!dict                |
          | R1     | 'linked_place' : 'city', 'wikidata': 'Q1234'  |
          | R2     | 'wikidata': 'Q1234'                     |
 
@@ -310,3 +311,22 @@ Feature: Linking of places
          | object     | name+_place_name  |
          | R1         | LabelPlace |
 
+
+    @skip
+    Scenario: Linked places expand default language names
+        Given the grid
+            | 1 |   | 2 |
+            |   | 9 |   |
+            | 4 |   | 3 |
+        Given the places
+            | osm | class    | type           | name+name                | geometry    |
+            | N9  | place    | city           | Popayán                  | 9           |
+            | R1  | boundary | administrative | Perímetro Urbano Popayán | (1,2,3,4,1) |
+        And the relations
+            | id | members  |
+            | 1  | N9:label |
+        When importing
+        Then placex contains
+            | object | name+_place_name | name+_place_name:es |
+            | R1     | Popayán          | Popayán             |
+
diff --git a/test/bdd/features/db/import/naming.feature b/test/bdd/features/db/import/naming.feature
new file mode 100644
index 00000000..944c2de7
--- /dev/null
+++ b/test/bdd/features/db/import/naming.feature
@@ -0,0 +1,104 @@
+Feature: Import and search of names
+    Tests all naming related import issues
+
+    Scenario: No copying name tag if only one name
+        Given the places
+          | osm | class | type      | name+name | geometry |
+          | N1  | place | locality  | german    | country:de |
+        When importing
+        Then placex contains
+          | object | country_code | name+name |
+          | N1     | de           | german |
+
+    Scenario: Copying name tag to default language if it does not exist
+        Given the places
+          | osm | class | type      | name+name | name+name:fi | geometry |
+          | N1  | place | locality  | german    | finnish      | country:de |
+        When importing
+        Then placex contains
+          | object | country_code | name+name | name+name:fi | name+name:de |
+          | N1     | de           | german    | finnish      | german       |
+
+    Scenario: Copying default language name tag to name if it does not exist
+        Given the places
+          | osm | class | type     | name+name:de | name+name:fi | geometry |
+          | N1  | place | locality | german       | finnish      | country:de |
+        When importing
+        Then placex contains
+          | object | country_code | name+name | name+name:fi | name+name:de |
+          | N1     | de           | german    | finnish      | german       |
+
+    Scenario: Do not overwrite default language with name tag
+        Given the places
+          | osm | class | type     | name+name | name+name:fi | name+name:de | geometry |
+          | N1  | place | locality | german    | finnish      | local        | country:de |
+        When importing
+        Then placex contains
+          | object | country_code | name+name | name+name:fi | name+name:de |
+          | N1     | de           | german    | finnish      | local        |
+
+    Scenario Outline: Names in any script can be found
+        Given the places
+            | osm | class | type   | name+name   |
+            | N1  | place | hamlet | <name> |
+        When importing
+        And geocoding "<name>"
+        Then the result set contains
+            | object |
+            | N1  |
+
+     Examples:
+        | name |
+        | Berlin |
+        | 北京 |
+        | Вологда |
+        | Αθήνα |
+        | القاهرة |
+        | រាជធានីភ្នំពេញ |
+        | 東京都 |
+        | ပုဗ္ဗသီရိ |
+
+
+    Scenario: German umlauts can be found when expanded
+        Given the places
+            | osm | class | type | name+name:de |
+            | N1  | place | city | Münster      |
+            | N2  | place | city | Köln         |
+            | N3  | place | city | Gräfenroda   |
+        When importing
+        When geocoding "münster"
+        Then the result set contains
+            | object |
+            | N1  |
+        When geocoding "muenster"
+        Then the result set contains
+            | object |
+            | N1  |
+        When geocoding "munster"
+        Then the result set contains
+            | object |
+            | N1  |
+        When geocoding "Köln"
+        Then the result set contains
+            | object |
+            | N2  |
+        When geocoding "Koeln"
+        Then the result set contains
+            | object |
+            | N2  |
+        When geocoding "Koln"
+        Then the result set contains
+            | object |
+            | N2  |
+        When geocoding "gräfenroda"
+        Then the result set contains
+            | object |
+            | N3  |
+        When geocoding "graefenroda"
+        Then the result set contains
+            | object |
+            | N3  |
+        When geocoding "grafenroda"
+        Then the result set contains
+            | object |
+            | N3  |
diff --git a/test/bdd/db/import/parenting.feature b/test/bdd/features/db/import/parenting.feature
similarity index 98%
rename from test/bdd/db/import/parenting.feature
rename to test/bdd/features/db/import/parenting.feature
index 55fa6a60..2cd09a8d 100644
--- a/test/bdd/db/import/parenting.feature
+++ b/test/bdd/features/db/import/parenting.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Parenting of objects
     Tests that the correct parent is chosen
 
@@ -21,14 +20,14 @@ Feature: Parenting of objects
          | object | parent_place_id |
          | N1     | W1 |
          | N2     | W1 |
-        When sending search query "4 galoo"
-        Then results contain
-         | ID | osm | display_name |
-         | 0  | N1  | 4, galoo, 12345, Deutschland |
-        When sending search query "5 galoo"
-        Then results contain
-         | ID | osm | display_name |
-         | 0  | N2  | 5, galoo, 99999, Deutschland |
+        When geocoding "4 galoo"
+        Then result 0 contains
+         | object | display_name |
+         | N1     | 4, galoo, 12345, Deutschland |
+        When geocoding "5 galoo"
+        Then result 0 contains
+         | object | display_name |
+         | N2     | 5, galoo, 99999, Deutschland |
 
     Scenario: Address without tags, closest street
         Given the grid
@@ -484,9 +483,9 @@ Feature: Parenting of objects
          | N1     | W3              | 3 |
          | N2     | W3              | 3 |
          | N3     | W3              | 3 |
-        When sending geocodejson search query "3, foo" with address
-        Then results contain
-         | housenumber |
+        When geocoding "3, foo"
+        Then the result set contains
+         | address+house_number |
          | 3           |
 
     Scenario: POIs don't inherit from streets
diff --git a/test/bdd/db/import/placex.feature b/test/bdd/features/db/import/placex.feature
similarity index 98%
rename from test/bdd/db/import/placex.feature
rename to test/bdd/features/db/import/placex.feature
index e0e8925f..8c1e4a8a 100644
--- a/test/bdd/db/import/placex.feature
+++ b/test/bdd/features/db/import/placex.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import into placex
     Tests that data in placex is completed correctly.
 
@@ -8,8 +7,8 @@ Feature: Import into placex
           | N1  | highway | primary  | country:us |
         When importing
         Then placex contains
-          | object | addr+country | country_code |
-          | N1     | -            | us           |
+          | object | address | country_code |
+          | N1     | -       | us           |
 
     Scenario: Location overwrites country code tag
         Given the named places
diff --git a/test/bdd/db/import/postcodes.feature b/test/bdd/features/db/import/postcodes.feature
similarity index 92%
rename from test/bdd/db/import/postcodes.feature
rename to test/bdd/features/db/import/postcodes.feature
index 3f4976f1..7f69b1e1 100644
--- a/test/bdd/db/import/postcodes.feature
+++ b/test/bdd/features/db/import/postcodes.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import of postcodes
     Tests for postcode estimation
 
@@ -170,18 +169,16 @@ Feature: Import of postcodes
             | object | postcode |
             | W93    | 11200    |
 
-    Scenario: Postcodes are added to the postcode and word table
+    Scenario: Postcodes are added to the postcode table
         Given the places
            | osm | class | type  | addr+postcode | addr+housenumber | geometry |
            | N34 | place | house | 01982         | 111              |country:de |
         When importing
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 01982    | country:de |
-        And there are word tokens for postcodes 01982
+           | country_code | postcode | geometry!wkt |
+           | de           | 01982    | country:de |
 
-
-    @Fail
+    @skip
     Scenario: search and address ranks for GB post codes correctly assigned
         Given the places
          | osm  | class | type     | postcode | geometry |
@@ -190,12 +187,12 @@ Feature: Import of postcodes
          | N3   | place | postcode | Y45      | country:gb |
         When importing
         Then location_postcode contains exactly
-         | postcode | country | rank_search | rank_address |
-         | E45 2CD  | gb      | 25          | 5 |
-         | E45 2    | gb      | 23          | 5 |
-         | Y45      | gb      | 21          | 5 |
+         | postcode | country_code | rank_search | rank_address |
+         | E45 2CD  | gb           | 25          | 5 |
+         | E45 2    | gb           | 23          | 5 |
+         | Y45      | gb           | 21          | 5 |
 
-    Scenario: Postcodes outside all countries are not added to the postcode and word table
+    Scenario: Postcodes outside all countries are not added to the postcode table
         Given the places
             | osm | class | type  | addr+postcode | addr+housenumber | addr+place  | geometry  |
             | N34 | place | house | 01982         | 111              | Null Island | 0 0.00001 |
@@ -204,9 +201,8 @@ Feature: Import of postcodes
             | N1  | place | hamlet | Null Island | 0 0      |
         When importing
         Then location_postcode contains exactly
-            | country | postcode | geometry |
-        And there are no word tokens for postcodes 01982
-        When sending search query "111, 01982 Null Island"
-        Then results contain
-            | osm | display_name |
-            | N34 | 111, Null Island, 01982 |
+            | place_id |
+        When geocoding "111, 01982 Null Island"
+        Then the result set contains
+            | object | display_name |
+            | N34    | 111, Null Island, 01982 |
diff --git a/test/bdd/db/import/rank_computation.feature b/test/bdd/features/db/import/rank_computation.feature
similarity index 91%
rename from test/bdd/db/import/rank_computation.feature
rename to test/bdd/features/db/import/rank_computation.feature
index df01fd91..de123a56 100644
--- a/test/bdd/db/import/rank_computation.feature
+++ b/test/bdd/features/db/import/rank_computation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Rank assignment
     Tests for assignment of search and address ranks.
 
@@ -173,13 +172,9 @@ Feature: Rank assignment
           | R23    | 20          | 0  |
           | R21    | 18          | 0  |
           | R22    | 16          | 16 |
-        Then place_addressline contains
+        Then place_addressline contains exactly
             | object | address | cached_rank_address |
             | N20    | R22     | 16                  |
-        Then place_addressline doesn't contain
-            | object | address |
-            | N20    | R21     |
-            | N20    | R23     |
 
     Scenario: adjacent admin_levels are considered different objects when they have different wikidata
         Given the named places
@@ -267,3 +262,34 @@ Feature: Rank assignment
           | object      | rank_search | rank_address |
           | N23:amenity | 30          | 30           |
           | N23:place   | 16          | 16           |
+
+    Scenario: Address rank 25 is only used for addr:place
+        Given the grid
+           | 10 | 33 | 34 | 11 |
+        Given the places
+          | osm | class | type    | name |
+          | N10 | place | village | vil  |
+          | N11 | place | farm    | farm |
+        And the places
+          | osm | class   | type        | name | geometry |
+          | W1  | highway | residential | RD   | 33,11    |
+        And the places
+          | osm | class   | type        | name | addr+farm | geometry |
+          | W2  | highway | residential | RD2  | farm       | 34,11    |
+        And the places
+          | osm | class | type  | housenr |
+          | N33 | place | house | 23      |
+        And the places
+          | osm | class | type  | housenr | addr+place |
+          | N34 | place | house | 23      | farm       |
+        When importing
+        Then placex contains
+          | object | parent_place_id |
+          | N11    | N10             |
+          | N33    | W1              |
+          | N34    | N11             |
+        And place_addressline contains
+          | object | address |
+          | W1     | N10     |
+          | W2     | N10     |
+          | W2     | N11     |
diff --git a/test/bdd/db/import/search_name.feature b/test/bdd/features/db/import/search_name.feature
similarity index 50%
rename from test/bdd/db/import/search_name.feature
rename to test/bdd/features/db/import/search_name.feature
index cd581c46..29b0f0bf 100644
--- a/test/bdd/db/import/search_name.feature
+++ b/test/bdd/features/db/import/search_name.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Creation of search terms
     Tests that search_name table is filled correctly
 
@@ -6,43 +5,40 @@ Feature: Creation of search terms
         Given the places
          | osm | class   | type | name+alt_name |
          | N1  | place   | city | New York; Big Apple |
+         | N2  | place   | town | New York Big Apple |
         When importing
-        Then search_name contains
-         | object | name_vector |
-         | N1     | #New York, #Big Apple |
+        And geocoding "New York Big Apple"
+        Then result 0 contains
+         | object |
+         | N2     |
 
     Scenario: Comma-separated names appear as a single full name
         Given the places
-         | osm | class   | type | name+alt_name |
+         | osm | class   | type | name+name |
          | N1  | place   | city | New York, Big Apple |
+         | N2  | place   | town | New York Big Apple |
         When importing
-        Then search_name contains
-         | object | name_vector |
-         | N1     | #New York Big Apple |
+        And geocoding "New York Big Apple"
+        Then result 0 contains
+         | object |
+         | N1     |
 
     Scenario: Name parts before brackets appear as full names
         Given the places
          | osm | class   | type | name+name |
          | N1  | place   | city | Halle (Saale) |
+         | N2  | place   | town | Halle |
         When importing
-        Then search_name contains
-         | object | name_vector |
-         | N1     | #Halle Saale, #Halle |
+        And geocoding "Halle"
+        Then result 0 contains
+         | object |
+         | N1     |
+        When geocoding "Halle (Saale)"
+        Then the result set contains
+         | object |
+         | N1 |
 
-    Scenario: Unnamed POIs have no search entry
-        Given the grid
-         |    | 1 |  |    |
-         | 10 |   |  | 11 |
-        And the places
-         | osm | class   | type        |
-         | N1  | place   | house       |
-        And the named places
-         | osm | class   | type        | geometry |
-         | W1  | highway | residential | 10,11    |
-        When importing
-        Then search_name has no entry for N1
-
-    Scenario: Unnamed POI has a search entry when it has unknown addr: tags
+    Scenario: Unknown addr: tags can be found for unnamed POIs
         Given the grid
          |    | 1 |  |    |
          | 10 |   |  | 11 |
@@ -53,21 +49,18 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | geometry |
          | W1  | highway | residential | Rose Street | 10,11    |
         When importing
-        Then search_name contains
-         | object | nameaddress_vector |
-         | N1     | #Rose Street, Walltown |
-        When sending search query "23 Rose Street, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "Walltown, Rose Street 23"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "Rose Street 23, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
+        When geocoding "23 Rose Street, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "Walltown, Rose Street 23"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "Rose Street 23, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
 
     Scenario: Searching for unknown addr: tags also works for multiple words
         Given the grid
@@ -80,23 +73,20 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | geometry |
          | W1  | highway | residential | Rose Street | 10,11    |
         When importing
-        Then search_name contains
-         | object | nameaddress_vector |
-         | N1     | #Rose Street, rose, Little, Big, Town |
-        When sending search query "23 Rose Street, Little Big Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "Rose Street 23, Little Big Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "Little big Town, Rose Street 23"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
+        When geocoding "23 Rose Street, Little Big Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "Rose Street 23, Little Big Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "Little big Town, Rose Street 23"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
 
-     Scenario: Unnamed POI has no search entry when it has known addr: tags
+     Scenario: Unnamed POI can be found when it has known addr: tags
         Given the grid
          |    | 1 |  |    |
          | 10 |   |  | 11 |
@@ -107,24 +97,10 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | addr+city | geometry |
          | W1  | highway | residential | Rose Street | Walltown  | 10,11    |
         When importing
-        Then search_name has no entry for N1
-        When sending search query "23 Rose Street, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-
-    Scenario: Unnamed POI must have a house number to get a search entry
-        Given the grid
-         |    | 1 |  |    |
-         | 10 |   |  | 11 |
-        And the places
-         | osm | class   | type   | addr+city |
-         | N1  | place   | house  | Walltown  |
-        And the places
-         | osm | class   | type        | name+name   | geometry |
-         | W1  | highway | residential | Rose Street | 10,11    |
-        When importing
-        Then search_name has no entry for N1
+        When geocoding "23 Rose Street, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
 
     Scenario: Unnamed POIs inherit parent name when unknown addr:place is present
         Given the grid
@@ -142,23 +118,22 @@ Feature: Creation of search terms
         Then placex contains
          | object | parent_place_id |
          | N1     | R1              |
-        When sending search query "23 Rose Street"
-        Then exactly 1 results are returned
-        And results contain
-         | osm | display_name |
-         | W1  | Rose Street, Strange Town |
-        When sending search query "23 Walltown, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Walltown, Strange Town |
-        When sending search query "Walltown 23, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Walltown, Strange Town |
-        When sending search query "Strange Town, Walltown 23"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Walltown, Strange Town |
+        When geocoding "23 Rose Street"
+        Then all results contain
+         | object | display_name |
+         | W1     | Rose Street, Strange Town |
+        When geocoding "23 Walltown, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Walltown, Strange Town |
+        When geocoding "Walltown 23, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Walltown, Strange Town |
+        When geocoding "Strange Town, Walltown 23"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Walltown, Strange Town |
 
     Scenario: Named POIs can be searched by housenumber when unknown addr:place is present
         Given the grid
@@ -173,26 +148,26 @@ Feature: Creation of search terms
          | W1  | highway | residential | Rose Street  | 10,11 |
          | R1  | place   | city        | Strange Town | (100,101,102,103,100) |
         When importing
-        When sending search query "23 Walltown, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Walltown, Strange Town |
-        When sending search query "Walltown 23, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Walltown, Strange Town |
-        When sending search query "Strange Town, Walltown 23"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Walltown, Strange Town |
-        When sending search query "Strange Town, Walltown 23, Blue house"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Walltown, Strange Town |
-        When sending search query "Strange Town, Walltown, Blue house"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Walltown, Strange Town |
+        When geocoding "23 Walltown, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Walltown, Strange Town |
+        When geocoding "Walltown 23, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Walltown, Strange Town |
+        When geocoding "Strange Town, Walltown 23"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Walltown, Strange Town |
+        When geocoding "Strange Town, Walltown 23, Blue house"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Walltown, Strange Town |
+        When geocoding "Strange Town, Walltown, Blue house"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Walltown, Strange Town |
 
     Scenario: Named POIs can be found when unknown multi-word addr:place is present
         Given the grid
@@ -207,14 +182,14 @@ Feature: Creation of search terms
          | W1  | highway | residential | Rose Street  | 10,11    |
          | R1  | place   | city        | Strange Town | (100,101,102,103,100) |
         When importing
-        When sending search query "23 Moon Sun, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Moon sun, Strange Town |
-        When sending search query "Blue house, Moon Sun, Strange Town"
-        Then results contain
-         | osm | display_name |
-         | N1  | Blue house, 23, Moon sun, Strange Town |
+        When geocoding "23 Moon Sun, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Moon sun, Strange Town |
+        When geocoding "Blue house, Moon Sun, Strange Town"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Blue house, 23, Moon sun, Strange Town |
 
     Scenario: Unnamed POIs doesn't inherit parent name when addr:place is present only in parent address
         Given the grid
@@ -229,16 +204,14 @@ Feature: Creation of search terms
          | W1  | highway | residential | Rose Street  | Walltown  | 10,11    |
          | R1  | place   | suburb      | Strange Town | Walltown  | (100,101,102,103,100) |
         When importing
-        When sending search query "23 Rose Street, Walltown"
-        Then exactly 1 result is returned
-        And results contain
-         | osm | display_name |
-         | W1  | Rose Street, Strange Town |
-        When sending search query "23  Walltown"
-        Then exactly 1 result is returned
-        And results contain
-         | osm | display_name |
-         | N1  | 23, Walltown, Strange Town |
+        When geocoding "23 Rose Street, Walltown"
+        Then all results contain
+         | object | display_name |
+         | W1     | Rose Street, Strange Town |
+        When geocoding "23  Walltown"
+        Then all results contain
+         | object | display_name |
+         | N1     | 23, Walltown, Strange Town |
 
     Scenario: Unnamed POIs does inherit parent name when unknown addr:place and addr:street is present
         Given the grid
@@ -251,12 +224,11 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | geometry |
          | W1  | highway | residential | Rose Street | 10,11    |
         When importing
-        Then search_name has no entry for N1
-        When sending search query "23 Rose Street"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "23 Lily Street"
+        When geocoding "23 Rose Street"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "23 Lily Street"
         Then exactly 0 results are returned
 
     Scenario: An unknown addr:street is ignored
@@ -270,15 +242,14 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | geometry |
          | W1  | highway | residential | Rose Street | 10,11    |
         When importing
-        Then search_name has no entry for N1
-        When sending search query "23 Rose Street"
-        Then results contain
-         | osm | display_name |
-         | N1  | 23, Rose Street |
-        When sending search query "23 Lily Street"
+        When geocoding "23 Rose Street"
+        Then the result set contains
+         | object | display_name |
+         | N1     | 23, Rose Street |
+        When geocoding "23 Lily Street"
         Then exactly 0 results are returned
 
-    Scenario: Named POIs get unknown address tags added in the search_name table
+    Scenario: Named POIs can be found through unknown address tags
         Given the grid
          |    | 1 |  |    |
          | 10 |   |  | 11 |
@@ -289,29 +260,26 @@ Feature: Creation of search terms
          | osm | class   | type        | name+name   | geometry |
          | W1  | highway | residential | Rose Street | 10,11    |
         When importing
-        Then search_name contains
-         | object | name_vector | nameaddress_vector |
-         | N1     | #Green Moss | #Rose Street, Walltown |
-        When sending search query "Green Moss, Rose Street, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, 26, Rose Street |
-        When sending search query "Green Moss, 26, Rose Street, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, 26, Rose Street |
-        When sending search query "26, Rose Street, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, 26, Rose Street |
-        When sending search query "Rose Street 26, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, 26, Rose Street |
-        When sending search query "Walltown, Rose Street 26"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, 26, Rose Street |
+        When geocoding "Green Moss, Rose Street, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, 26, Rose Street |
+        When geocoding "Green Moss, 26, Rose Street, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, 26, Rose Street |
+        When geocoding "26, Rose Street, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, 26, Rose Street |
+        When geocoding "Rose Street 26, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, 26, Rose Street |
+        When geocoding "Walltown, Rose Street 26"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, 26, Rose Street |
 
     Scenario: Named POI doesn't inherit parent name when addr:place is present only in parent address
         Given the grid
@@ -326,12 +294,12 @@ Feature: Creation of search terms
          | W1  | highway | residential | Rose Street  | 10,11    |
          | R1  | place   | suburb      | Strange Town | (100,101,102,103,100) |
         When importing
-        When sending search query "Green Moss, Rose Street, Walltown"
-        Then exactly 0 result is returned
-        When sending search query "Green Moss, Walltown"
-        Then results contain
-         | osm | display_name |
-         | N1  | Green Moss, Walltown, Strange Town |
+        When geocoding "Green Moss, Rose Street, Walltown"
+        Then exactly 0 results are returned
+        When geocoding "Green Moss, Walltown"
+        Then the result set contains
+         | object | display_name |
+         | N1     | Green Moss, Walltown, Strange Town |
 
     Scenario: Named POIs inherit address from parent
         Given the grid
@@ -342,9 +310,10 @@ Feature: Creation of search terms
          | N1  | place   | house       | foo      | 1        |
          | W1  | highway | residential | the road | 10,11    |
         When importing
-        Then search_name contains
-         | object | name_vector | nameaddress_vector |
-         | N1     | foo         | #the road |
+        When geocoding "foo, the road"
+        Then all results contain
+         | object |
+         | N1     |
 
     Scenario: Some addr: tags are added to address
         Given the grid
@@ -354,13 +323,14 @@ Feature: Creation of search terms
          | osm | class   | type        | name     |
          | N2  | place   | city        | bonn     |
          | N3  | place   | suburb      | smalltown|
-        And the named places
-         | osm | class   | type    | addr+city | addr+municipality | addr+suburb | geometry |
-         | W1  | highway | service | bonn      | New York          | Smalltown   | 10,11    |
+        And the places
+         | osm | class   | type    | name    | addr+city | addr+municipality | addr+suburb | geometry |
+         | W1  | highway | service | the end | bonn      | New York          | Smalltown   | 10,11    |
         When importing
-        Then search_name contains
-         | object | nameaddress_vector |
-         | W1     | bonn, new, york, smalltown |
+        When geocoding "the end, new york, bonn, smalltown"
+        Then all results contain
+         | object |
+         | W1     |
 
     Scenario: A known addr:* tag is added even if the name is unknown
         Given the grid
@@ -369,36 +339,22 @@ Feature: Creation of search terms
          | osm | class   | type        | name | addr+city | geometry |
          | W1  | highway | residential | Road | Nandu     | 10,11    |
         When importing
-        Then search_name contains
-         | object | nameaddress_vector |
-         | W1     | nandu |
-
-    Scenario: addr:postcode is not added to the address terms
-        Given the grid with origin DE
-         |    | 1 |  |    |
-         | 10 |   |  | 11 |
-        And the places
-         | osm | class   | type        | name+ref  |
-         | N1  | place   | state       | 12345     |
-        And the named places
-         | osm | class   | type        | addr+postcode | geometry |
-         | W1  | highway | residential | 12345         | 10,11    |
-        When importing
-        Then search_name contains not
-         | object | nameaddress_vector |
-         | W1     | 12345 |
+        And geocoding "Road, Nandu"
+        Then all results contain
+         | object |
+         | W1     |
 
     Scenario: a linked place does not show up in search name
         Given the 0.01 grid
          | 10 |   | 11 |
          |    | 2 |    |
          | 13 |   | 12 |
-        Given the named places
-         | osm  | class    | type           | admin | geometry |
-         | R13  | boundary | administrative | 9     | (10,11,12,13,10) |
-        And the named places
-         | osm  | class    | type           |
-         | N2   | place    | city           |
+        Given the places
+         | osm  | class    | type           | name | admin | geometry |
+         | R13  | boundary | administrative | Roma | 9     | (10,11,12,13,10) |
+        And the places
+         | osm  | class    | type           | name |
+         | N2   | place    | city           | Cite |
         And the relations
          | id | members       | tags+type |
          | 13 | N2:label      | boundary |
@@ -406,7 +362,10 @@ Feature: Creation of search terms
         Then placex contains
          | object | linked_place_id |
          | N2     | R13             |
-        And search_name has no entry for N2
+        When geocoding "Cite"
+        Then all results contain
+         | object |
+         | R13 |
 
     Scenario: a linked waterway does not show up in search name
         Given the grid
@@ -424,5 +383,7 @@ Feature: Creation of search terms
          | object | linked_place_id |
          | W1     | R13 |
          | W2     | R13 |
-        And search_name has no entry for W1
-        And search_name has no entry for W2
+        When geocoding "Rhein"
+        Then all results contain
+         | object |
+         | R13 |
diff --git a/test/bdd/db/query/housenumbers.feature b/test/bdd/features/db/query/housenumbers.feature
similarity index 64%
rename from test/bdd/db/query/housenumbers.feature
rename to test/bdd/features/db/query/housenumbers.feature
index 16d9fd5a..6ed6284b 100644
--- a/test/bdd/db/query/housenumbers.feature
+++ b/test/bdd/features/db/query/housenumbers.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Searching of house numbers
     Test for specialised treeatment of housenumbers
 
@@ -17,13 +16,13 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | North Road | 1,2,3    |
         When importing
-        And sending search query "45, North Road"
-        Then results contain
-         | osm |
+        And geocoding "45, North Road"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "North Road 45"
-        Then results contain
-         | osm |
+        When geocoding "North Road 45"
+        Then the result set contains
+         | object |
          | N1  |
 
 
@@ -35,17 +34,17 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | North Road | 1,2,3    |
         When importing
-        And sending search query "45, North Road"
-        Then results contain
-         | osm |
+        And geocoding "45, North Road"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "North Road ④⑤"
-        Then results contain
-         | osm |
+        When geocoding "North Road ④⑤"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "North Road 𑁪𑁫"
-        Then results contain
-         | osm |
+        When geocoding "North Road 𑁪𑁫"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -63,17 +62,17 @@ Feature: Searching of house numbers
          | osm | class   | type | name     | geometry |
          | W10 | highway | path | Multistr | 1,2,3    |
         When importing
-        When sending search query "2 Multistr"
-        Then results contain
-         | osm |
+        When geocoding "2 Multistr"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "4 Multistr"
-        Then results contain
-         | osm |
+        When geocoding "4 Multistr"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "12 Multistr"
-        Then results contain
-         | osm |
+        When geocoding "12 Multistr"
+        Then the result set contains
+         | object |
          | N1  |
 
      Examples:
@@ -91,21 +90,21 @@ Feature: Searching of house numbers
          | osm | class   | type | name     | geometry |
          | W10 | highway | path | Multistr | 1,2,3    |
         When importing
-        When sending search query "2A Multistr"
-        Then results contain
-         | osm |
+        When geocoding "2A Multistr"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "2 a Multistr"
-        Then results contain
-         | osm |
+        When geocoding "2 a Multistr"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "2-A Multistr"
-        Then results contain
-         | osm |
+        When geocoding "2-A Multistr"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Multistr 2 A"
-        Then results contain
-         | osm |
+        When geocoding "Multistr 2 A"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -124,21 +123,21 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Chester St | 1,2,3    |
         When importing
-        When sending search query "34-10 Chester St"
-        Then results contain
-         | osm |
+        When geocoding "34-10 Chester St"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "34/10 Chester St"
-        Then results contain
-         | osm |
+        When geocoding "34/10 Chester St"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "34 10 Chester St"
-        Then results contain
-         | osm |
+        When geocoding "34 10 Chester St"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "3410 Chester St"
-        Then results contain
-         | osm |
+        When geocoding "3410 Chester St"
+        Then the result set contains
+         | object |
          | W10 |
 
     Examples:
@@ -156,21 +155,21 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Rue Paris | 1,2,3    |
         When importing
-        When sending search query "Rue Paris 45bis"
-        Then results contain
-         | osm |
+        When geocoding "Rue Paris 45bis"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue Paris 45 BIS"
-        Then results contain
-         | osm |
+        When geocoding "Rue Paris 45 BIS"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue Paris 45BIS"
-        Then results contain
-         | osm |
+        When geocoding "Rue Paris 45BIS"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue Paris 45 bis"
-        Then results contain
-         | osm |
+        When geocoding "Rue Paris 45 bis"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -189,21 +188,21 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Rue du Berger | 1,2,3    |
         When importing
-        When sending search query "Rue du Berger 45ter"
-        Then results contain
-         | osm |
+        When geocoding "Rue du Berger 45ter"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue du Berger 45 TER"
-        Then results contain
-         | osm |
+        When geocoding "Rue du Berger 45 TER"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue du Berger 45TER"
-        Then results contain
-         | osm |
+        When geocoding "Rue du Berger 45TER"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Rue du Berger 45 ter"
-        Then results contain
-         | osm |
+        When geocoding "Rue du Berger 45 ter"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -222,21 +221,21 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Herengracht | 1,2,3    |
         When importing
-        When sending search query "501-H 1 Herengracht"
-        Then results contain
-         | osm |
+        When geocoding "501-H 1 Herengracht"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "501H-1 Herengracht"
-        Then results contain
-         | osm |
+        When geocoding "501H-1 Herengracht"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "501H1 Herengracht"
-        Then results contain
-         | osm |
+        When geocoding "501H1 Herengracht"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "501-H1 Herengracht"
-        Then results contain
-         | osm |
+        When geocoding "501-H1 Herengracht"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -255,17 +254,17 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Голубинская улица | 1,2,3    |
         When importing
-        When sending search query "Голубинская улица 55к3"
-        Then results contain
-         | osm |
+        When geocoding "Голубинская улица 55к3"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Голубинская улица 55 k3"
-        Then results contain
-         | osm |
+        When geocoding "Голубинская улица 55 k3"
+        Then the result set contains
+         | object |
          | N1  |
-        When sending search query "Голубинская улица 55 к-3"
-        Then results contain
-         | osm |
+        When geocoding "Голубинская улица 55 к-3"
+        Then the result set contains
+         | object |
          | N1  |
 
     Examples:
@@ -282,9 +281,9 @@ Feature: Searching of house numbers
          | osm | class   | type | name       | geometry |
          | W10 | highway | path | Chester St | 1,2,3    |
         When importing
-        When sending search query "Chester St Warring"
-        Then results contain
-         | osm |
+        When geocoding "Chester St Warring"
+        Then the result set contains
+         | object |
          | N1  |
 
 
@@ -311,11 +310,11 @@ Feature: Searching of house numbers
          | 10 | 10, 11 |
          | 20 | 20, 21 |
         When importing
-        When sending search query "Ringstr 12"
-        Then results contain
-         | osm |
+        When geocoding "Ringstr 12"
+        Then the result set contains
+         | object |
          | W10 |
-        When sending search query "Ringstr 13"
-        Then results contain
-         | osm |
+        When geocoding "Ringstr 13"
+        Then the result set contains
+         | object |
          | W20 |
diff --git a/test/bdd/db/query/interpolation.feature b/test/bdd/features/db/query/interpolation.feature
similarity index 72%
rename from test/bdd/db/query/interpolation.feature
rename to test/bdd/features/db/query/interpolation.feature
index 600de718..1746d37d 100644
--- a/test/bdd/db/query/interpolation.feature
+++ b/test/bdd/features/db/query/interpolation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Query of address interpolations
     Tests that interpolated addresses can be queried correctly
 
@@ -23,14 +22,14 @@ Feature: Query of address interpolations
           | id | nodes |
           | 1  | 1,3   |
         When importing
-        When sending v1/reverse N2
-        Then results contain
-          | ID | display_name |
-          | 0  | 3, Nickway   |
-        When sending search query "Nickway 3"
-        Then results contain
-          | osm | display_name |
-          | W1  | 3, Nickway   |
+        When reverse geocoding at node 2
+        Then the result contains
+          | display_name |
+          | 3, Nickway   |
+        When geocoding "Nickway 3"
+        Then all results contain
+          | object | display_name |
+          | W1     | 3, Nickway   |
 
 
     Scenario: Find interpolations with multiple numbers
@@ -48,11 +47,11 @@ Feature: Query of address interpolations
           | id | nodes |
           | 1  | 1,3   |
         When importing
-        When sending v1/reverse N2
-        Then results contain
-          | ID | display_name | centroid |
-          | 0  | 10, Nickway  | 2 |
-        When sending search query "Nickway 10"
-        Then results contain
-          | osm | display_name  | centroid |
-          | W1  | 10, Nickway   | 2 |
+        When reverse geocoding at node 2
+        Then the result contains
+          | display_name | centroid!wkt |
+          | 10, Nickway  | 2 |
+        When geocoding "Nickway 10"
+        Then all results contain
+          | object | display_name  | centroid!wkt |
+          | W1     | 10, Nickway   | 2 |
diff --git a/test/bdd/db/query/japanese.feature b/test/bdd/features/db/query/japanese.feature
similarity index 92%
rename from test/bdd/db/query/japanese.feature
rename to test/bdd/features/db/query/japanese.feature
index f21e0f5c..4fad118c 100644
--- a/test/bdd/db/query/japanese.feature
+++ b/test/bdd/features/db/query/japanese.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Searches in Japan
     Test specifically for searches of Japanese addresses and in Japanese language.
     Scenario: A block house-number is parented to the neighbourhood
@@ -23,7 +22,7 @@ Feature: Searches in Japan
         Then placex contains
           | object | parent_place_id |
           | N3     | N9              |
-        When sending search query "2丁目 6-2"
-        Then results contain
-          | osm |
+        When geocoding "2丁目 6-2"
+        Then all results contain
+          | object |
           | N3  |
diff --git a/test/bdd/db/query/linking.feature b/test/bdd/features/db/query/linking.feature
similarity index 72%
rename from test/bdd/db/query/linking.feature
rename to test/bdd/features/db/query/linking.feature
index 351f8871..8e6ab4d1 100644
--- a/test/bdd/db/query/linking.feature
+++ b/test/bdd/features/db/query/linking.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Searching linked places
     Tests that information from linked places can be searched correctly
 
@@ -20,18 +19,18 @@ Feature: Searching linked places
         Then placex contains
          | object  | linked_place_id |
          | N2      | R13 |
-        When sending search query "Vario"
+        When geocoding "Vario"
          | namedetails |
          | 1 |
-        Then results contain
-         | osm | display_name | namedetails |
-         | R13 | Garbo | "name": "Garbo", "name:it": "Vario" |
-        When sending search query "Vario"
+        Then all results contain
+         | object | display_name | namedetails!dict |
+         | R13    | Garbo | "name": "Garbo", "name:it": "Vario" |
+        When geocoding "Vario"
          | accept-language |
          | it |
-        Then results contain
-         | osm | display_name |
-         | R13 | Vario |
+        Then all results contain
+         | object | display_name |
+         | R13    | Vario |
 
 
     Scenario: Differing names from linked places are searchable
@@ -52,13 +51,13 @@ Feature: Searching linked places
         Then placex contains
          | object  | linked_place_id |
          | N2      | R13 |
-        When sending search query "Vario"
+        When geocoding "Vario"
          | namedetails |
          | 1 |
-        Then results contain
-         | osm | display_name | namedetails |
-         | R13 | Garbo        | "name": "Garbo", "_place_name": "Vario" |
-        When sending search query "Garbo"
-        Then results contain
-         | osm | display_name |
-         | R13 | Garbo |
+        Then all results contain
+         | object | display_name | namedetails!dict |
+         | R13    | Garbo        | "name": "Garbo", "_place_name": "Vario" |
+        When geocoding "Garbo"
+        Then all results contain
+         | object | display_name |
+         | R13    | Garbo |
diff --git a/test/bdd/features/db/query/normalization.feature b/test/bdd/features/db/query/normalization.feature
new file mode 100644
index 00000000..f884be6b
--- /dev/null
+++ b/test/bdd/features/db/query/normalization.feature
@@ -0,0 +1,225 @@
+Feature: Import and search of names
+    Tests all naming related issues: normalisation,
+    abbreviations, internationalisation, etc.
+
+    Scenario: non-latin scripts can be found
+        Given the places
+          | osm | class | type      | name |
+          | N1  | place | locality  | Речицкий район |
+          | N2  | place | locality  | Refugio de montaña |
+          | N3  | place | locality  | 高槻市|
+          | N4  | place | locality  | الدوحة |
+        When importing
+        When geocoding "Речицкий район"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Refugio de montaña"
+        Then result 0 contains
+         | object |
+         | N2 |
+        When geocoding "高槻市"
+        Then result 0 contains
+         | object |
+         | N3 |
+        When geocoding "الدوحة"
+        Then result 0 contains
+         | object |
+         | N4 |
+
+    Scenario: Case-insensitivity of search
+        Given the places
+          | osm | class | type      | name |
+          | N1  | place | locality  | FooBar |
+        When importing
+        Then placex contains
+          | object | class  | type     | name+name |
+          | N1     | place  | locality | FooBar |
+        When geocoding "FooBar"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "foobar"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "fOObar"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "FOOBAR"
+        Then result 0 contains
+         | object |
+         | N1 |
+
+    Scenario: Multiple spaces in name
+        Given the places
+          | osm | class | type      | name |
+          | N1  | place | locality  | one two  three |
+        When importing
+        When geocoding "one two three"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "one   two three"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "one two  three"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "    one two three"
+        Then result 0 contains
+         | object |
+         | N1 |
+
+    Scenario: Special characters in name
+        Given the places
+          | osm | class | type      | name+name:de |
+          | N1  | place | locality  | Jim-Knopf-Straße |
+          | N2  | place | locality  | Smith/Weston |
+          | N3  | place | locality  | space mountain |
+          | N4  | place | locality  | space |
+          | N5  | place | locality  | mountain |
+        When importing
+        When geocoding "Jim-Knopf-Str"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Jim Knopf-Str"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Jim Knopf Str"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Jim/Knopf-Str"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Jim-Knopfstr"
+        Then result 0 contains
+         | object |
+         | N1 |
+        When geocoding "Smith/Weston"
+        Then result 0 contains
+         | object |
+         | N2 |
+        When geocoding "Smith Weston"
+        Then result 0 contains
+         | object |
+         | N2 |
+        When geocoding "Smith-Weston"
+        Then result 0 contains
+         | object |
+         | N2 |
+        When geocoding "space mountain"
+        Then result 0 contains
+         | object |
+         | N3 |
+        When geocoding "space-mountain"
+        Then result 0 contains
+         | object |
+         | N3 |
+        When geocoding "space/mountain"
+        Then result 0 contains
+         | object |
+         | N3 |
+        When geocoding "space\mountain"
+        Then result 0 contains
+         | object |
+         | N3 |
+        When geocoding "space(mountain)"
+        Then result 0 contains
+         | object |
+         | N3 |
+
+    Scenario: Landuse with name are found
+        Given the grid
+          | 1 | 2 |
+          | 3 |   |
+        Given the places
+          | osm | class    | type        | name     | geometry |
+          | R1  | natural  | meadow      | landuse1 | (1,2,3,1) |
+          | R2  | landuse  | industrial  | landuse2 | (2,3,1,2) |
+        When importing
+        When geocoding "landuse1"
+        Then result 0 contains
+         | object |
+         | R1 |
+        When geocoding "landuse2"
+        Then result 0 contains
+         | object |
+         | R2 |
+
+    Scenario: Postcode boundaries without ref
+        Given the grid with origin FR
+          |   | 2 |   |
+          | 1 |   | 3 |
+        Given the places
+          | osm | class    | type        | postcode  | geometry |
+          | R1  | boundary | postal_code | 123-45    | (1,2,3,1) |
+        When importing
+        When geocoding "123-45"
+        Then result 0 contains
+         | object |
+         | R1 |
+
+    Scenario Outline: Housenumbers with special characters are found
+        Given the grid
+            | 1 |  |   |  | 2 |
+            |   |  | 9 |  |   |
+        And the places
+            | osm | class   | type    | name    | geometry |
+            | W1  | highway | primary | Main St | 1,2      |
+        And the places
+            | osm | class    | type | housenr | geometry |
+            | N1  | building | yes  | <nr>    | 9        |
+        When importing
+        And geocoding "Main St <nr>"
+        Then result 0 contains
+         | object | display_name |
+         | N1     | <nr>, Main St |
+
+    Examples:
+        | nr |
+        | 1  |
+        | 3456 |
+        | 1 a |
+        | 56b |
+        | 1 A |
+        | 2號 |
+        | 1Б  |
+        | 1 к1 |
+        | 23-123 |
+
+    Scenario Outline: Housenumbers in lists are found
+        Given the grid
+            | 1 |  |   |  | 2 |
+            |   |  | 9 |  |   |
+        And the places
+            | osm | class   | type    | name    | geometry |
+            | W1  | highway | primary | Main St | 1,2      |
+        And the places
+            | osm | class    | type | housenr   | geometry |
+            | N1  | building | yes  | <nr-list> | 9        |
+        When importing
+        And geocoding "Main St <nr>"
+        Then result 0 contains
+         | object | display_name |
+         | N1     | <nr-list>, Main St |
+
+    Examples:
+        | nr-list    | nr |
+        | 1,2,3      | 1  |
+        | 1,2,3      | 2  |
+        | 1, 2, 3    | 3  |
+        | 45 ;67;3   | 45 |
+        | 45 ;67;3   | 67 |
+        | 1a;1k      | 1a |
+        | 1a;1k      | 1k |
+        | 34/678     | 34 |
+        | 34/678     | 678 |
+        | 34/678     | 34/678 |
diff --git a/test/bdd/db/query/postcodes.feature b/test/bdd/features/db/query/postcodes.feature
similarity index 64%
rename from test/bdd/db/query/postcodes.feature
rename to test/bdd/features/db/query/postcodes.feature
index e8a2ccc2..f5ffcd00 100644
--- a/test/bdd/db/query/postcodes.feature
+++ b/test/bdd/features/db/query/postcodes.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Querying fo postcode variants
 
     Scenario: Postcodes in Singapore (6-digit postcode)
@@ -8,10 +7,10 @@ Feature: Querying fo postcode variants
             | osm | class   | type | name   | addr+postcode | geometry |
             | W1  | highway | path | Lorang | 399174        | 10,11    |
         When importing
-        When sending search query "399174"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | 399174, Singapore |
+        When geocoding "399174"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | 399174, Singapore |
 
 
     Scenario Outline: Postcodes in the Netherlands (mixed postcode with spaces)
@@ -21,14 +20,14 @@ Feature: Querying fo postcode variants
             | osm | class   | type | name     | addr+postcode | geometry |
             | W1  | highway | path | De Weide | 3993 DX       | 10,11    |
         When importing
-        When sending search query "3993 DX"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | 3993 DX, Nederland      |
-        When sending search query "3993dx"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | 3993 DX, Nederland      |
+        When geocoding "3993 DX"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | 3993 DX, Nederland      |
+        When geocoding "3993dx"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | 3993 DX, Nederland      |
 
         Examples:
             | postcode |
@@ -44,10 +43,10 @@ Feature: Querying fo postcode variants
             | osm | class   | type | name   | addr+postcode | geometry |
             | W1  | highway | path | Lorang | 399174        | 10,11    |
         When importing
-        When sending search query "399174"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | 399174, Singapore       |
+        When geocoding "399174"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | 399174, Singapore       |
 
 
     Scenario Outline: Postcodes in Andorra (with country code)
@@ -57,14 +56,14 @@ Feature: Querying fo postcode variants
             | osm | class   | type | name   | addr+postcode | geometry |
             | W1  | highway | path | Lorang | <postcode>    | 10,11    |
         When importing
-        When sending search query "675"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | AD675, Andorra |
-        When sending search query "AD675"
-        Then results contain
-            | ID | type     | display_name |
-            | 0  | postcode | AD675, Andorra |
+        When geocoding "675"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | AD675, Andorra |
+        When geocoding "AD675"
+        Then result 0 contains
+            | type     | display_name |
+            | postcode | AD675, Andorra |
 
         Examples:
             | postcode |
@@ -80,15 +79,15 @@ Feature: Querying fo postcode variants
            | N35 | place | house | E4 7EA        | 111              | country:gb |
         When importing
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | gb      | EH4 7EA  | country:gb |
-           | gb      | E4 7EA   | country:gb |
-        When sending search query "EH4 7EA"
-        Then results contain
+           | country_code | postcode | geometry!wkt |
+           | gb           | EH4 7EA  | country:gb |
+           | gb           | E4 7EA   | country:gb |
+        When geocoding "EH4 7EA"
+        Then result 0 contains
            | type     | display_name |
            | postcode | EH4 7EA, United Kingdom |
-        When sending search query "E4 7EA"
-        Then results contain
+        When geocoding "E4 7EA"
+        Then result 0 contains
            | type     | display_name |
            | postcode | E4 7EA, United Kingdom |
 
@@ -102,9 +101,9 @@ Feature: Querying fo postcode variants
             | R23 | boundary | postal_code | 12345    | (1,2,3,4,1) |
         When importing
         Then location_postcode contains exactly
-          | country | postcode |
-          | de      | 12345    |
-        When sending search query "12345, de"
-        Then results contain
-          | osm |
+          | country_code | postcode |
+          | de           | 12345    |
+        When geocoding "12345, de"
+        Then result 0 contains
+          | object |
           | R23 |
diff --git a/test/bdd/db/query/reverse.feature b/test/bdd/features/db/query/reverse.feature
similarity index 72%
rename from test/bdd/db/query/reverse.feature
rename to test/bdd/features/db/query/reverse.feature
index 11ee8685..55c2162d 100644
--- a/test/bdd/db/query/reverse.feature
+++ b/test/bdd/features/db/query/reverse.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Reverse searches
     Test results of reverse queries
 
@@ -12,11 +11,11 @@ Feature: Reverse searches
           | W1  | aeroway | terminal   | (1,2,3,4,1) |
           | N1  | amenity | restaurant | 9           |
         When importing
-        And sending v1/reverse at 1.0001,1.0001
-        Then results contain
-         | osm |
+        And reverse geocoding 1.0001,1.0001
+        Then the result contains
+         | object |
          | N1  |
-        When sending v1/reverse at 1.0003,1.0001
-        Then results contain
-         | osm |
+        When reverse geocoding 1.0003,1.0001
+        Then the result contains
+         | object |
          | W1  |
diff --git a/test/bdd/db/query/search_simple.feature b/test/bdd/features/db/query/search_simple.feature
similarity index 61%
rename from test/bdd/db/query/search_simple.feature
rename to test/bdd/features/db/query/search_simple.feature
index 5fef3132..c46efec6 100644
--- a/test/bdd/db/query/search_simple.feature
+++ b/test/bdd/features/db/query/search_simple.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Searching of simple objects
     Testing simple stuff
 
@@ -7,32 +6,10 @@ Feature: Searching of simple objects
           | osm | class | type    | name+name | geometry   |
           | N1  | place | village | Foo       | 10.0 -10.0 |
         When importing
-        And sending search query "Foo"
-        Then results contain
-         | ID | osm | category | type    | centroid |
-         | 0  | N1  | place    | village | 10 -10   |
-
-     Scenario: Updating postcode in postcode boundaries without ref
-        Given the grid
-          | 1 | 2 |
-          | 4 | 3 |
-        Given the places
-          | osm | class    | type        | postcode | geometry |
-          | R1  | boundary | postal_code | 12345    | (1,2,3,4,1) |
-        When importing
-        And sending search query "12345"
-        Then results contain
-         | ID | osm |
-         | 0  | R1 |
-        When updating places
-          | osm | class    | type        | postcode | geometry |
-          | R1  | boundary | postal_code | 54321    | (1,2,3,4,1) |
-        And sending search query "12345"
-        Then exactly 0 results are returned
-        When sending search query "54321"
-        Then results contain
-         | ID | osm |
-         | 0  | R1 |
+        And geocoding "Foo"
+        Then result 0 contains
+         | object | category | type    | centroid!wkt |
+         | N1     | place    | village | 10 -10   |
 
     # github #1763
     Scenario: Correct translation of highways under construction
@@ -44,8 +21,8 @@ Feature: Searching of simple objects
          | W1  | highway | construction | The build | 1,2      |
          | N1  | amenity | cafe         | Bean      | 9        |
         When importing
-        And sending json search query "Bean" with address
-        Then result addresses contain
+        And geocoding "Bean"
+        Then result 0 contains in field address
          | amenity | road |
          | Bean    | The build |
 
@@ -57,11 +34,11 @@ Feature: Searching of simple objects
          | osm | class   | type       | name        | housenr |
          | N20 | amenity | restaurant | Red Way     | 34      |
         When importing
-        And sending search query "Wood Street 45"
+        And geocoding "Wood Street 45"
         Then exactly 0 results are returned
-        When sending search query "Red Way 34"
-        Then results contain
-         | osm |
+        When geocoding "Red Way 34"
+        Then all results contain
+         | object |
          | N20 |
 
      Scenario: when the housenumber is missing the street is still returned
@@ -71,12 +48,11 @@ Feature: Searching of simple objects
          | osm | class   | type        | name        | geometry |
          | W1  | highway | residential | Wood Street | 1, 2     |
         When importing
-        And sending search query "Wood Street"
-        Then results contain
-         | osm |
+        And geocoding "Wood Street"
+        Then all results contain
+         | object |
          | W1  |
 
-
      Scenario Outline: Special cased american states will be found
         Given the grid
          | 1 |    | 2 |
@@ -90,15 +66,15 @@ Feature: Searching of simple objects
          | N2   | place | town  | <city> | 10          |
          | N3   | place | city  | <city>  | country:ca  |
         When importing
-        And sending search query "<city>, <state>"
-        Then results contain
-         | osm |
+        And geocoding "<city>, <state>"
+        Then all results contain
+         | object |
          | N2  |
-        When sending search query "<city>, <ref>"
+        When geocoding "<city>, <ref>"
          | accept-language |
          | en |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | N2  |
 
      Examples:
diff --git a/test/bdd/db/update/country.feature b/test/bdd/features/db/update/country.feature
similarity index 72%
rename from test/bdd/db/update/country.feature
rename to test/bdd/features/db/update/country.feature
index abc1af09..75e552c7 100644
--- a/test/bdd/db/update/country.feature
+++ b/test/bdd/features/db/update/country.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Country handling
     Tests for update of country information
 
@@ -16,14 +15,14 @@ Feature: Country handling
             | osm | class    | type          | name  |
             | N10 | place    | town          | Wenig |
         When importing
-        When sending search query "Wenig, Loudou"
-        Then results contain
-            | osm |
+        When geocoding "Wenig, Loudou"
+        Then all results contain
+            | object |
             | N10 |
         When updating places
             | osm | class    | type           | admin | name+name:xy | country | geometry |
             | R1  | boundary | administrative | 2     | Germany      | de      | (1,2,3,4,1) |
-        When sending search query "Wenig, Loudou"
+        When geocoding "Wenig, Loudou"
         Then exactly 0 results are returned
 
     Scenario: When country names are deleted they are no longer searchable
@@ -34,21 +33,21 @@ Feature: Country handling
             | osm | class    | type          | name  |
             | N10 | place    | town          | Wenig |
         When importing
-        When sending search query "Wenig, Loudou"
-        Then results contain
-            | osm |
+        When geocoding "Wenig, Loudou"
+        Then all results contain
+            | object |
             | N10 |
         When updating places
             | osm | class    | type           | admin | name+name:en | country | geometry |
             | R1  | boundary | administrative | 2     | Germany      | de      | (1,2,3,4,1) |
-        When sending search query "Wenig, Loudou"
+        When geocoding "Wenig, Loudou"
         Then exactly 0 results are returned
-        When sending search query "Wenig"
+        When geocoding "Wenig"
             | accept-language |
             | xy,en |
-        Then results contain
-            | osm | display_name |
-            | N10 | Wenig, Germany |
+        Then all results contain
+            | object | display_name |
+            | N10    | Wenig, Germany |
 
 
     Scenario: Default country names are always searchable
@@ -56,29 +55,29 @@ Feature: Country handling
             | osm | class    | type          | name  |
             | N10 | place    | town          | Wenig |
         When importing
-        When sending search query "Wenig, Germany"
-        Then results contain
-            | osm |
+        When geocoding "Wenig, Germany"
+        Then all results contain
+            | object |
             | N10 |
-        When sending search query "Wenig, de"
-        Then results contain
-            | osm |
+        When geocoding "Wenig, de"
+        Then all results contain
+            | object |
             | N10 |
         When updating places
             | osm  | class    | type           | admin | name+name:en | country | geometry |
             | R1   | boundary | administrative | 2     | Lilly        | de      | (1,2,3,4,1) |
-        When sending search query "Wenig, Germany"
+        When geocoding "Wenig, Germany"
             | accept-language |
             | en,de |
-        Then results contain
-            | osm | display_name |
+        Then all results contain
+            | object | display_name |
             | N10 | Wenig, Lilly |
-        When sending search query "Wenig, de"
+        When geocoding "Wenig, de"
             | accept-language |
             | en,de |
-        Then results contain
-            | osm | display_name |
-            | N10 | Wenig, Lilly |
+        Then all results contain
+            | object | display_name |
+            | N10    | Wenig, Lilly |
 
 
     Scenario: When a localised name is deleted, the standard name takes over
@@ -89,21 +88,21 @@ Feature: Country handling
             | osm | class    | type          | name  |
             | N10 | place    | town          | Wenig |
         When importing
-        When sending search query "Wenig, Loudou"
+        When geocoding "Wenig, Loudou"
             | accept-language |
             | de,en |
-        Then results contain
-            | osm | display_name |
+        Then all results contain
+            | object | display_name |
             | N10 | Wenig, Loudou |
         When updating places
             | osm | class    | type           | admin | name+name:en | country | geometry |
             | R1  | boundary | administrative | 2     | Germany      | de      | (1,2,3,4,1) |
-        When sending search query "Wenig, Loudou"
+        When geocoding "Wenig, Loudou"
         Then exactly 0 results are returned
-        When sending search query "Wenig"
+        When geocoding "Wenig"
             | accept-language |
             | de,en |
-        Then results contain
-            | osm | display_name |
-            | N10 | Wenig, Deutschland |
+        Then all results contain
+            | object | display_name |
+            | N10    | Wenig, Deutschland |
 
diff --git a/test/bdd/db/update/interpolation.feature b/test/bdd/features/db/update/interpolation.feature
similarity index 99%
rename from test/bdd/db/update/interpolation.feature
rename to test/bdd/features/db/update/interpolation.feature
index 421fdc01..e548862b 100644
--- a/test/bdd/db/update/interpolation.feature
+++ b/test/bdd/features/db/update/interpolation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update of address interpolations
     Test the interpolated address are updated correctly
 
@@ -334,7 +333,7 @@ Feature: Update of address interpolations
           | W1              | 4     | 4   |
           | W1              | 8     | 8   |
 
-    @Fail
+    @skip
     Scenario: housenumber removed in middle of interpolation
       Given the grid
           | 1 |  |  |   |  | 2 |
diff --git a/test/bdd/db/update/linked_places.feature b/test/bdd/features/db/update/linked_places.feature
similarity index 92%
rename from test/bdd/db/update/linked_places.feature
rename to test/bdd/features/db/update/linked_places.feature
index d6370ebb..d622cbfb 100644
--- a/test/bdd/db/update/linked_places.feature
+++ b/test/bdd/features/db/update/linked_places.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Updates of linked places
     Tests that linked places are correctly added and deleted.
 
@@ -40,11 +39,11 @@ Feature: Updates of linked places
         Then placex contains
          | object | linked_place_id |
          | N1     | R1 |
-        When sending search query "foo"
+        When geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | R1 |
         When updating places
          | osm | class    | type           | name   | admin | geometry |
@@ -52,11 +51,11 @@ Feature: Updates of linked places
         Then placex contains
          | object | linked_place_id |
          | N1     | - |
-        When sending search query "foo"
+        When geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | N1 |
 
     Scenario: Add linked place when linking relation is removed
@@ -71,21 +70,21 @@ Feature: Updates of linked places
             | osm | class    | type           | name | admin | geometry |
             | R1  | boundary | administrative | foo  | 8     | (10,11,12,13,10) |
         When importing
-        And sending search query "foo"
+        And geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | R1 |
         When marking for delete R1
         Then placex contains
          | object | linked_place_id |
          | N1     | - |
-        When sending search query "foo"
+        When geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | N1 |
 
     Scenario: Remove linked place when linking relation is added
@@ -97,11 +96,11 @@ Feature: Updates of linked places
             | osm | class | type | name |
             | N1  | place | city | foo  |
         When importing
-        And sending search query "foo"
+        And geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | N1 |
         When updating places
          | osm | class    | type           | name   | admin | geometry |
@@ -109,11 +108,11 @@ Feature: Updates of linked places
         Then placex contains
          | object | linked_place_id |
          | N1     | R1 |
-        When sending search query "foo"
+        When geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | R1 |
 
     Scenario: Remove linked place when linking relation is renamed
@@ -128,11 +127,11 @@ Feature: Updates of linked places
          | osm | class    | type           | name   | admin | geometry |
          | R1  | boundary | administrative | foobar | 8     | (10,11,12,13,10) |
         When importing
-        And sending search query "foo"
+        And geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | N1 |
         When updating places
          | osm | class    | type           | name   | admin | geometry |
@@ -140,11 +139,11 @@ Feature: Updates of linked places
         Then placex contains
          | object | linked_place_id |
          | N1     | R1 |
-        When sending search query "foo"
+        When geocoding "foo"
          | dups |
          | 1    |
-        Then results contain
-         | osm |
+        Then all results contain
+         | object |
          | R1 |
 
     Scenario: Update linking relation when linkee name is updated
@@ -199,9 +198,9 @@ Feature: Updates of linked places
         And placex contains
          | object | linked_place_id | name+name |
          | N3     | R1              | greeny  |
-        When sending search query "greeny"
-        Then results contain
-          | osm |
+        When geocoding "greeny"
+        Then all results contain
+          | object |
           | R1  |
         When updating places
          | osm | class    | type        | name+name:de |
@@ -212,7 +211,7 @@ Feature: Updates of linked places
         And placex contains
          | object | linked_place_id | name+_place_name:de | name+name |
          | R1     | -               | depnt               | rel       |
-        When sending search query "greeny"
+        When geocoding "greeny"
         Then exactly 0 results are returned
 
     Scenario: Updating linkee extratags keeps linker's extratags
@@ -231,13 +230,13 @@ Feature: Updates of linked places
          | 1  | N3:label |
         When importing
         Then placex contains
-         | object | extratags |
+         | object | extratags!dict |
          | R1     | 'wikidata' : '34', 'linked_place' : 'city' |
         When updating places
          | osm | class    | type        | name    | extra+oneway |
          | N3  | place    | city        | newname | yes          |
         Then placex contains
-         | object | extratags |
+         | object | extratags!dict |
          | R1     | 'wikidata' : '34', 'oneway' : 'yes', 'linked_place' : 'city' |
 
     Scenario: Remove linked_place info when linkee is removed
@@ -253,7 +252,7 @@ Feature: Updates of linked places
             | R1  | boundary | administrative | foo  | 8     | (10,11,12,13,10) |
         When importing
         Then placex contains
-            | object | extratags |
+            | object | extratags!dict |
             | R1     | 'linked_place' : 'city' |
         When marking for delete N1
         Then placex contains
@@ -273,13 +272,13 @@ Feature: Updates of linked places
             | R1  | boundary | administrative | foo  | 8     | (10,11,12,13,10) |
         When importing
         Then placex contains
-            | object | extratags |
+            | object | extratags!dict |
             | R1     | 'linked_place' : 'city' |
         When updating places
             | osm | class | type | name |
             | N1  | place | town | foo  |
         Then placex contains
-            | object | extratags |
+            | object | extratags!dict |
             | R1     | 'linked_place' : 'town' |
 
 
diff --git a/test/bdd/db/update/naming.feature b/test/bdd/features/db/update/naming.feature
similarity index 83%
rename from test/bdd/db/update/naming.feature
rename to test/bdd/features/db/update/naming.feature
index 6c1a817b..2912a7da 100644
--- a/test/bdd/db/update/naming.feature
+++ b/test/bdd/features/db/update/naming.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update of names in place objects
     Test all naming related issues in updates
 
@@ -10,10 +9,10 @@ Feature: Update of names in place objects
           | osm | class    | type        | postcode | geometry |
           | R1  | boundary | postal_code | 123-45    | (1,2,3,4,1) |
         When importing
-        And sending search query "123-45"
-        Then results contain
-         | ID | osm |
-         | 0  | R1 |
+        And geocoding "123-45"
+        Then result 0 contains
+         | object |
+         | R1 |
         When updating places
           | osm | class    | type        | geometry |
           | R1  | boundary | postal_code | (1,2,3,4,1) |
diff --git a/test/bdd/db/update/parenting.feature b/test/bdd/features/db/update/parenting.feature
similarity index 99%
rename from test/bdd/db/update/parenting.feature
rename to test/bdd/features/db/update/parenting.feature
index 1a23d903..28f74cbe 100644
--- a/test/bdd/db/update/parenting.feature
+++ b/test/bdd/features/db/update/parenting.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update parenting of objects
 
     Scenario: POI inside building inherits addr:street change
@@ -111,7 +110,7 @@ Feature: Update parenting of objects
 
 
     # Invalidation of geometries currently disabled for addr:place matches.
-    @Fail
+    @skip
     Scenario: Housenumber is reparented when place is renamed to matching addr:place
         Given the grid
          | 1 |    |   | 2 |
diff --git a/test/bdd/db/update/postcode.feature b/test/bdd/features/db/update/postcode.feature
similarity index 61%
rename from test/bdd/db/update/postcode.feature
rename to test/bdd/features/db/update/postcode.feature
index 39318101..d62953e7 100644
--- a/test/bdd/db/update/postcode.feature
+++ b/test/bdd/features/db/update/postcode.feature
@@ -1,51 +1,68 @@
-@DB
 Feature: Update of postcode
     Tests for updating of data related to postcodes
 
-    Scenario: A new postcode appears in the postcode and word table
+     Scenario: Updating postcode in postcode boundaries without ref
+        Given the grid
+          | 1 | 2 |
+          | 4 | 3 |
+        Given the places
+          | osm | class    | type        | postcode | geometry |
+          | R1  | boundary | postal_code | 12345    | (1,2,3,4,1) |
+        When importing
+        And geocoding "12345"
+        Then result 0 contains
+         | object |
+         | R1 |
+        When updating places
+          | osm | class    | type        | postcode | geometry |
+          | R1  | boundary | postal_code | 54321    | (1,2,3,4,1) |
+        And geocoding "12345"
+        Then exactly 0 results are returned
+        When geocoding "54321"
+        Then result 0 contains
+         | object |
+         | R1 |
+
+    Scenario: A new postcode appears in the postcode table
         Given the places
            | osm | class | type  | addr+postcode | addr+housenumber | geometry |
-           | N34 | place | house | 01982         | 111              |country:de |
+           | N34 | place | house | 01982         | 111              | country:de |
         When importing
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 01982    | country:de |
+           | country_code | postcode | geometry!wkt |
+           | de           | 01982    | country:de |
         When updating places
            | osm | class | type  | addr+postcode | addr+housenumber | geometry |
-           | N35 | place | house | 4567          | 5                |country:ch |
+           | N35 | place | house | 4567          | 5                | country:ch |
         And updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 01982    | country:de |
-           | ch      | 4567     | country:ch |
-        And there are word tokens for postcodes 01982,4567
+           | country_code | postcode | geometry!wkt |
+           | de           | 01982    | country:de |
+           | ch           | 4567     | country:ch |
 
-     Scenario: When the last postcode is deleted, it is deleted from postcode and word
+     Scenario: When the last postcode is deleted, it is deleted from postcode
         Given the places
            | osm | class | type  | addr+postcode | addr+housenumber | geometry |
-           | N34 | place | house | 01982         | 111              |country:de |
-           | N35 | place | house | 4567          | 5                |country:ch |
+           | N34 | place | house | 01982         | 111              | country:de |
+           | N35 | place | house | 4567          | 5                | country:ch |
         When importing
         And marking for delete N34
         And updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | ch      | 4567     | country:ch |
-        And there are word tokens for postcodes 4567
-        And there are no word tokens for postcodes 01982
+           | country_code | postcode | geometry!wkt |
+           | ch           | 4567     | country:ch |
 
-     Scenario: A postcode is not deleted from postcode and word when it exist in another country
+     Scenario: A postcode is not deleted from postcode when it exists in another country
         Given the places
            | osm | class | type  | addr+postcode | addr+housenumber | geometry |
-           | N34 | place | house | 01982         | 111              |country:de |
-           | N35 | place | house | 01982         | 5                |country:fr |
+           | N34 | place | house | 01982         | 111              | country:de |
+           | N35 | place | house | 01982         | 5                | country:fr |
         When importing
         And marking for delete N34
         And updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | fr      | 01982    | country:fr |
-        And there are word tokens for postcodes 01982
+           | country_code | postcode | geometry!wkt |
+           | fr           | 01982    | country:fr |
 
      Scenario: Updating a postcode is reflected in postcode table
         Given the places
@@ -57,9 +74,8 @@ Feature: Update of postcode
            | N34 | place | postcode | 20453         | country:de |
         And updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 20453    | country:de |
-        And there are word tokens for postcodes 20453
+           | country_code | postcode | geometry!wkt |
+           | de           | 20453    | country:de |
 
      Scenario: When changing from a postcode type, the entry appears in placex
         When importing
@@ -71,16 +87,15 @@ Feature: Update of postcode
            | osm | class | type  | addr+postcode | housenr |  geometry |
            | N34 | place | house | 20453         | 1       | country:de |
         Then placex contains
-           | object | addr+housenumber | geometry |
-           | N34    | 1                | country:de|
+           | object | addr+housenumber | geometry!wkt |
+           | N34    | 1                | country:de |
         And place contains exactly
-           | object | class | type  |
-           | N34    | place | house |
+           | osm_type | osm_id | class | type  |
+           | N        | 34     | place | house |
         When updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 20453    | country:de |
-        And there are word tokens for postcodes 20453
+           | country_code | postcode | geometry!wkt |
+           | de           | 20453    | country:de |
 
      Scenario: When changing to a postcode type, the entry disappears from placex
         When importing
@@ -88,20 +103,19 @@ Feature: Update of postcode
            | osm | class | type  | addr+postcode | housenr |  geometry |
            | N34 | place | house | 20453         | 1       | country:de |
         Then placex contains
-           | object | addr+housenumber | geometry |
+           | object | addr+housenumber | geometry!wkt |
            | N34    | 1                | country:de|
         When updating places
            | osm | class | type     | addr+postcode |  geometry |
            | N34 | place | postcode | 01982         | country:de |
         Then placex has no entry for N34
         And place contains exactly
-           | object | class | type     |
-           | N34    | place | postcode |
+           | osm_type | osm_id | class | type     |
+           | N        | 34     | place | postcode |
         When updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry |
-           | de      | 01982    | country:de |
-        And there are word tokens for postcodes 01982
+           | country_code | postcode | geometry!wkt |
+           | de           | 01982    | country:de |
 
     Scenario: When a parent is deleted, the postcode gets a new parent
         Given the grid with origin DE
@@ -112,15 +126,14 @@ Feature: Update of postcode
            | osm | class    | type           | name  | admin | geometry    |
            | R1  | boundary | administrative | Big   | 6     | (1,4,6,2,1) |
            | R2  | boundary | administrative | Small | 6     | (1,3,5,2,1) |
-        Given the named places
+        Given the places
            | osm | class | type     | addr+postcode | geometry |
            | N9  | place | postcode | 12345         | 9        |
         When importing
-        And updating postcodes
         Then location_postcode contains exactly
-           | country | postcode | geometry | parent_place_id |
-           | de      | 12345    | 9        | R2              |
+           | postcode | geometry!wkt | parent_place_id |
+           | 12345    | 9            | R2              |
         When marking for delete R2
         Then location_postcode contains exactly
-           | country | postcode | geometry | parent_place_id |
-           | de      | 12345    | 9        | R1              |
+           | country_code | postcode | geometry!wkt | parent_place_id |
+           | de           | 12345    | 9            | R1              |
diff --git a/test/bdd/db/update/simple.feature b/test/bdd/features/db/update/simple.feature
similarity index 95%
rename from test/bdd/db/update/simple.feature
rename to test/bdd/features/db/update/simple.feature
index 73abcd22..22165c2f 100644
--- a/test/bdd/db/update/simple.feature
+++ b/test/bdd/features/db/update/simple.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update of simple objects
     Testing simple updating functionality
 
@@ -47,7 +46,9 @@ Feature: Update of simple objects
           | R1     | 0 |
           | R2     | 26 |
           | W1     | 30 |
-        When marking for delete R1,R2,W1
+        When marking for delete R1
+        And marking for delete R2
+        And marking for delete W1
         Then placex has no entry for W1
         Then placex has no entry for R1
         Then placex has no entry for R2
@@ -58,13 +59,13 @@ Feature: Update of simple objects
           | N3  | shop  | toys | 1 -1 |
         When importing
         Then placex contains
-          | object | class | type | centroid |
+          | object | class | type | centroid!wkt |
           | N3     | shop  | toys | 1 -1 |
         When updating places
           | osm | class | type    | geometry |
           | N3  | shop  | grocery | 1 -1 |
         Then placex contains
-          | object | class | type    | centroid |
+          | object | class | type    | centroid!wkt |
           | N3     | shop  | grocery | 1 -1 |
 
     Scenario: remove postcode place when house number is added
diff --git a/test/bdd/osm2pgsql/import/broken.feature b/test/bdd/features/osm2pgsql/import/broken.feature
similarity index 64%
rename from test/bdd/osm2pgsql/import/broken.feature
rename to test/bdd/features/osm2pgsql/import/broken.feature
index 13b9a088..6f04a30f 100644
--- a/test/bdd/osm2pgsql/import/broken.feature
+++ b/test/bdd/features/osm2pgsql/import/broken.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import of objects with broken geometries by osm2pgsql
 
     Scenario: Import way with double nodes
@@ -10,23 +9,27 @@ Feature: Import of objects with broken geometries by osm2pgsql
           w1 Thighway=primary Nn100,n101,n101,n102
           """
         Then place contains
-          | object | class   | type    | geometry |
+          | object | class   | type    | geometry!wkt |
           | W1     | highway | primary | 0 0, 0 0.1, 0.1 0.2 |
 
     Scenario: Import of ballon areas
+        Given the grid
+         | 2 |  | 3 |
+         | 1 |  | 4 |
+         | 5 |  |   |
         When loading osm data
           """
-          n1   x0 y0
-          n2   x0 y0.0001
-          n3   x0.00001 y0.0001
-          n4   x0.00001 y0
-          n5   x-0.00001 y0
+          n1
+          n2
+          n3
+          n4
+          n5
           w1 Thighway=unclassified Nn1,n2,n3,n4,n1,n5
           w2 Thighway=unclassified Nn1,n2,n3,n4,n1
           w3 Thighway=unclassified Nn1,n2,n3,n4,n3
           """
         Then place contains
-          | object | geometrytype |
-          | W1     | ST_LineString |
-          | W2     | ST_Polygon |
-          | W3     | ST_LineString |
+          | object | geometry!wkt |
+          | W1     | 1,2,3,4,1,5  |
+          | W2     | (1,2,3,4,1)  |
+          | W3     | 1,2,3,4      |
diff --git a/test/bdd/osm2pgsql/import/custom_style.feature b/test/bdd/features/osm2pgsql/import/custom_style.feature
similarity index 50%
rename from test/bdd/osm2pgsql/import/custom_style.feature
rename to test/bdd/features/osm2pgsql/import/custom_style.feature
index 2ca95c91..05ab73aa 100644
--- a/test/bdd/osm2pgsql/import/custom_style.feature
+++ b/test/bdd/features/osm2pgsql/import/custom_style.feature
@@ -1,8 +1,7 @@
-@DB
 Feature: Import with custom styles by osm2pgsql
     Tests for the example customizations given in the documentation.
 
-    Scenario: Custom main tags
+    Scenario: Custom main tags (set new ones)
         Given the lua style file
             """
             local flex = require('import-full')
@@ -28,6 +27,35 @@ Feature: Import with custom styles by osm2pgsql
             | N13    | highway  | primary        |
             | N15    | highway  | primary        |
 
+    Scenario: Custom main tags (modify existing)
+        Given the lua style file
+            """
+            local flex = require('import-full')
+
+            flex.modify_main_tags{
+                amenity = {prison = 'delete'},
+                highway = {stop = 'named'},
+                aeroway = 'named'
+            }
+            """
+        When loading osm data
+            """
+            n10 Tamenity=hotel x0 y0
+            n11 Tamenity=prison x0 y0
+            n12 Thighway=stop x0 y0
+            n13 Thighway=stop,name=BigStop x0 y0
+            n14 Thighway=give_way x0 y0
+            n15 Thighway=bus_stop x0 y0
+            n16 Taeroway=no,name=foo x0 y0
+            n17 Taeroway=taxiway,name=D15 x0 y0
+            """
+        Then place contains exactly
+            | object | class   | type     |
+            | N10    | amenity | hotel    |
+            | N13    | highway | stop     |
+            | N15    | highway | bus_stop |
+            | N17    | aeroway | taxiway  |
+
     Scenario: Prefiltering tags
         Given the lua style file
             """
@@ -50,11 +78,43 @@ Feature: Import with custom styles by osm2pgsql
             n4 Ttourism=hotel,amenity=telephone x0 y0
             """
         Then place contains exactly
-            | object     | extratags              |
-            | N2:amenity | -                      |
-            | N3:tourism | 'amenity': 'yes'       |
-            | N4:tourism | - |
-            | N4:amenity | - |
+            | object | class   | extratags!dict   |
+            | N2     | amenity | -                |
+            | N3     | tourism | 'amenity': 'yes' |
+            | N4     | tourism | -                |
+            | N4     | amenity | -                |
+
+    Scenario: Ignore some tags
+        Given the lua style file
+            """
+            local flex = require('import-extratags')
+
+            flex.ignore_keys{'ref:*', 'surface'}
+            """
+        When loading osm data
+            """
+            n100 Thighway=residential,ref=34,ref:bodo=34,surface=gray,extra=1 x0 y0
+            """
+        Then place contains exactly
+            | object | name!dict    | extratags!dict |
+            | N100   | 'ref' : '34' | 'extra': '1'   |
+
+
+    Scenario: Add for extratags
+        Given the lua style file
+            """
+            local flex = require('import-full')
+
+            flex.add_for_extratags{'ref:*', 'surface'}
+            """
+        When loading osm data
+            """
+            n100 Thighway=residential,ref=34,ref:bodo=34,surface=gray,extra=1 x0 y0
+            """
+        Then place contains exactly
+            | object | name!dict    | extratags!dict  |
+            | N100   | 'ref' : '34' | 'ref:bodo': '34', 'surface': 'gray' |
+
 
     Scenario: Name tags
         Given the lua style file
@@ -74,9 +134,25 @@ Feature: Import with custom styles by osm2pgsql
             n4 Thighway=traffic_light,name=Red,ref=45 x0 y0
             """
         Then place contains exactly
-            | object     | name                       |
-            | N3:highway | 'name': 'Greens'           |
-            | N4:highway | 'name': 'Red', 'ref': '45' |
+            | object | class   | name!dict                  |
+            | N3     | highway | 'name': 'Greens'           |
+            | N4     | highway | 'name': 'Red', 'ref': '45' |
+
+    Scenario: Modify name tags
+        Given the lua style file
+            """
+            local flex = require('import-full')
+
+            flex.modify_name_tags{house = {}, extra = {'o'}}
+            """
+        When loading osm data
+            """
+            n1 Ttourism=hotel,ref=45,o=good
+            n2 Taddr:housename=Old,addr:street=Away
+            """
+        Then place contains exactly
+            | object | class   | name!dict   |
+            | N1     | tourism | 'o': 'good' |
 
     Scenario: Address tags
         Given the lua style file
@@ -97,11 +173,28 @@ Feature: Import with custom styles by osm2pgsql
             n3 Taddr:street=None,addr:city=Where x0 y0
             """
         Then place contains exactly
-            | object     | type  | address |
-            | N1:tourism | hotel | 'street': 'Foo' |
-            | N2:place   | house | 'housenumber': '23', 'street': 'Budd', 'postcode': '5567' |
+            | object | class   | type  | address!dict |
+            | N1     | tourism | hotel | 'street': 'Foo' |
+            | N2     | place   | house | 'housenumber': '23', 'street': 'Budd', 'postcode': '5567' |
+
+    Scenario: Modify address tags
+        Given the lua style file
+            """
+            local flex = require('import-full')
+
+            flex.set_address_tags{
+                extra = {'addr:*'},
+            }
+            """
+        When loading osm data
+            """
+            n2 Taddr:housenumber=23,addr:street=Budd,is_in:city=Faraway,postal_code=5567 x0 y0
+            """
+        Then place contains exactly
+            | object | class | type  | address!dict |
+            | N2     | place | house | 'housenumber': '23', 'street': 'Budd', 'postcode': '5567' |
 
-    Scenario: Unused handling
+    Scenario: Unused handling (delete)
         Given the lua style file
             """
             local flex = require('import-full')
@@ -118,9 +211,34 @@ Feature: Import with custom styles by osm2pgsql
             n2 Ttourism=hotel,tiger:xxd=56,else=other x0 y0
             """
         Then place contains exactly
-            | object     | type  | address                 | extratags        |
-            | N1:tourism | hotel | 'tiger:county': 'Fargo' | -                |
-            | N2:tourism | hotel | -                       | 'else': 'other'  |
+            | object | class   | type  | address!dict            | extratags!dict   |
+            | N1     | tourism | hotel | 'tiger:county': 'Fargo' | -                |
+            | N2     | tourism | hotel | -                       | 'else': 'other'  |
+
+    Scenario: Unused handling (extra)
+        Given the lua style file
+            """
+            local flex = require('flex-base')
+            flex.set_main_tags{highway = 'always',
+                               wikipedia = 'extra'}
+            flex.add_for_extratags{'wikipedia:*', 'wikidata'}
+            flex.set_unused_handling{extra_keys = {'surface'}}
+            """
+        When loading osm data
+            """
+            n100 Thighway=path,foo=bar,wikipedia=en:Path x0 y0
+            n234 Thighway=path,surface=rough x0 y0
+            n445 Thighway=path,name=something x0 y0
+            n446 Thighway=path,wikipedia:en=Path,wikidata=Q23 x0 y0
+            n567 Thighway=path,surface=dirt,wikipedia:en=Path x0 y0
+            """
+        Then place contains exactly
+            | object | class   | type  | extratags!dict         |
+            | N100   | highway | path  | 'wikipedia': 'en:Path' |
+            | N234   | highway | path  | 'surface': 'rough' |
+            | N445   | highway | path  | - |
+            | N446   | highway | path  | 'wikipedia:en': 'Path', 'wikidata': 'Q23' |
+            | N567   | highway | path  | 'surface': 'dirt', 'wikipedia:en': 'Path' |
 
     Scenario: Additional relation types
         Given the lua style file
@@ -143,9 +261,9 @@ Feature: Import with custom styles by osm2pgsql
             r2 Ttype=site,amenity=school Mw1@
             """
         Then place contains exactly
-            | object     | type   |
-            | R1:amenity | school |
-            | R2:amenity | school |
+            | object | class   | type   |
+            | R1     | amenity | school |
+            | R2     | amenity | school |
 
     Scenario: Exclude country relations
         Given the lua style file
@@ -172,8 +290,8 @@ Feature: Import with custom styles by osm2pgsql
             r2 Ttype=multipolygon,boundary=administrative,admin_level=2,name=Big Mw1@
             """
         Then place contains exactly
-            | object      | type           |
-            | R1:boundary | administrative |
+            | object | class    | type           |
+            | R1     | boundary | administrative |
 
     Scenario: Customize processing functions
         Given the lua style file
@@ -196,5 +314,5 @@ Feature: Import with custom styles by osm2pgsql
             n2 Thighway=residential,access=no x0 y0
             """
         Then place contains exactly
-            | object     | type        |
-            | N1:highway | residential |
+            | object | class   | type        |
+            | N1     | highway | residential |
diff --git a/test/bdd/osm2pgsql/import/relation.feature b/test/bdd/features/osm2pgsql/import/relation.feature
similarity index 98%
rename from test/bdd/osm2pgsql/import/relation.feature
rename to test/bdd/features/osm2pgsql/import/relation.feature
index 7010779e..13d4278e 100644
--- a/test/bdd/osm2pgsql/import/relation.feature
+++ b/test/bdd/features/osm2pgsql/import/relation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import of relations by osm2pgsql
     Testing specific relation problems related to members.
 
diff --git a/test/bdd/osm2pgsql/import/simple.feature b/test/bdd/features/osm2pgsql/import/simple.feature
similarity index 78%
rename from test/bdd/osm2pgsql/import/simple.feature
rename to test/bdd/features/osm2pgsql/import/simple.feature
index 5e329c6a..217c2b7c 100644
--- a/test/bdd/osm2pgsql/import/simple.feature
+++ b/test/bdd/features/osm2pgsql/import/simple.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Import of simple objects by osm2pgsql
     Testing basic tagging in osm2pgsql imports.
 
@@ -18,7 +17,7 @@ Feature: Import of simple objects by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XZ Mn1@,w2@
           """
         Then place contains exactly
-          | object | class   | type   | name            | geometry |
+          | object | class   | type   | name!dict       | geometry!wkt |
           | N1     | amenity | prison | 'name' : 'foo'  | 34.3 -23 |
           | W1     | shop    | toys   | 'name' : 'tata' | 0 0, 0 0.1, 0.1 0.2 |
           | R1     | tourism | hotel  | 'name' : 'XZ'   | (0 0, 0 1, 1 1, 1 0, 0 0) |
@@ -28,16 +27,16 @@ Feature: Import of simple objects by osm2pgsql
           """
           n1 Ttourism=hotel,amenity=restaurant,name=foo
           """
-        Then place contains
-          | object     | type       | name |
-          | N1:tourism | hotel      | 'name' : 'foo' |
-          | N1:amenity | restaurant | 'name' : 'foo' |
+        Then place contains exactly
+          | object | class   | type       | name!dict      |
+          | N1     | tourism | hotel      | 'name' : 'foo' |
+          | N1     | amenity | restaurant | 'name' : 'foo' |
 
     Scenario: Import stand-alone house number with postcode
         When loading osm data
           """
           n1 Taddr:housenumber=4,addr:postcode=3345
           """
-        Then place contains
+        Then place contains exactly
           | object | class | type |
           | N1     | place | house |
diff --git a/test/bdd/osm2pgsql/import/tags.feature b/test/bdd/features/osm2pgsql/import/tags.feature
similarity index 57%
rename from test/bdd/osm2pgsql/import/tags.feature
rename to test/bdd/features/osm2pgsql/import/tags.feature
index 7958f4b3..0671a43f 100644
--- a/test/bdd/osm2pgsql/import/tags.feature
+++ b/test/bdd/features/osm2pgsql/import/tags.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Tag evaluation
     Tests if tags are correctly imported into the place table
 
@@ -30,16 +29,16 @@ Feature: Tag evaluation
             n2006 Thighway=yes,name:%9%de=Foo,name=rea\l3
             """
         Then place contains exactly
-            | object | class   | type | name |
+            | object | class   | type | name!dict |
             | N2001  | highway | road | 'name': 'Foo', 'alt_name:de': 'Bar', 'ref': '45' |
             | N2002  | highway | road | - |
             | N2003  | highway | yes  | 'name: de': 'Foo', 'name': 'real1' |
-            | N2004  | highway | yes  | 'name:\nde': 'Foo', 'name': 'real2' |
-            | N2005  | highway | yes  | 'name:\tde': 'Foo', 'name:\\\\': 'real3' |
-            | N2006  | highway | yes  | 'name:\tde': 'Foo', 'name': 'rea\\l3' |
+            | N2004  | highway | yes  | 'name:\\nde': 'Foo', 'name': 'real2' |
+            | N2005  | highway | yes  | 'name:\tde': 'Foo', r'name:\\\\': 'real3' |
+            | N2006  | highway | yes  | 'name:\tde': 'Foo', 'name': r'rea\l3' |
 
         And place contains
-            | object | extratags |
+            | object | extratags!dict |
             | N2002  | 'name:prefix': 'Pre', 'name:suffix': 'Post', 'ref:de': '55' |
 
 
@@ -50,7 +49,7 @@ Feature: Tag evaluation
             n3002 Tbridge=yes,bridge:name:en=Rainbow
             """
         Then place contains exactly
-            | object | class   | type | name                 |
+            | object | class   | type | name!dict            |
             | N3001  | bridge  | yes  | 'name': 'GoldenGate' |
             | N3002  | bridge  | yes  | 'name:en': 'Rainbow' |
 
@@ -62,7 +61,7 @@ Feature: Tag evaluation
             n4002 Taddr:streetnumber=10,is_in:city=Rootoo,is_in=Gold
             """
         Then place contains exactly
-            | object | class | address             |
+            | object | class | address!dict |
             | N4001  | place | 'housenumber': '34', 'city': 'Esmarald', 'county': 'Land' |
             | N4002  | place | 'streetnumber': '10', 'city': 'Rootoo' |
 
@@ -78,7 +77,7 @@ Feature: Tag evaluation
             n5006 Tshop=yes,addr:country=France
             """
         Then place contains exactly
-            | object | class | address         |
+            | object | class | address!dict    |
             | N5001  | shop  | 'country': 'DE' |
             | N5002  | shop  | - |
             | N5003  | shop  | - |
@@ -95,7 +94,7 @@ Feature: Tag evaluation
             n6003 Tshop=bank,is_in:postcode=9009
             """
         Then place contains exactly
-            | object | class | address             |
+            | object | class | address!dict        |
             | N6001  | shop  | 'postcode': '12345' |
             | N6002  | shop  | 'postcode': '34343' |
             | N6003  | shop  | -                   |
@@ -111,7 +110,7 @@ Feature: Tag evaluation
             w1 Tboundary=postal_code,ref=3456 Nn1,n2,n3,n4,n1
             """
         Then place contains exactly
-            | object | class    | type        | name          |
+            | object | class    | type        | name!dict     |
             | W1     | boundary | postal_code | 'ref': '3456' |
 
     Scenario: Main with extra
@@ -121,24 +120,24 @@ Feature: Tag evaluation
             n7002 Thighway=primary,bridge=yes,bridge:name=1
             """
         Then place contains exactly
-            | object        | class   | type    | name        | extratags+bridge:name |
-            | N7001         | highway | primary | 'name': '1' | -                     |
-            | N7002:highway | highway | primary | -           | 1                     |
-            | N7002:bridge  | bridge  | yes     | 'name': '1' | 1                     |
+            | object | class   | type    | name!dict   | extratags!dict |
+            | N7001  | highway | primary | 'name': '1' | 'bridge': 'yes' |
+            | N7002  | highway | primary | -           | 'bridge': 'yes', 'bridge:name': '1' |
+            | N7002  | bridge  | yes     | 'name': '1' | 'highway': 'primary', 'bridge:name': '1' |
 
 
     Scenario: Global fallback and skipping
         When loading osm data
             """
             n8001 Tshop=shoes,note:de=Nein,xx=yy
-            n8002 Tshop=shoes,building=no,ele=234
+            n8002 Tshop=shoes,natural=no,ele=234
             n8003 Tshop=shoes,name:source=survey
             """
         Then place contains exactly
-            | object | class | name | extratags    |
-            | N8001  | shop  |  -   | 'xx': 'yy'   |
-            | N8002  | shop  |  -   | 'ele': '234' |
-            | N8003  | shop  |  -   | -            |
+            | object | class | name!dict | extratags!dict |
+            | N8001  | shop  |  -        | 'xx': 'yy'   |
+            | N8002  | shop  |  -        | 'ele': '234' |
+            | N8003  | shop  |  -        | -            |
 
 
     Scenario: Admin levels
@@ -169,14 +168,14 @@ Feature: Tag evaluation
             n10003 Tboundary=administrative,place=island,name=C
             """
         Then place contains
-            | object          | class    | type           | extratags       |
-            | N10001          | boundary | administrative | 'place': 'city' |
+            | object | class    | type           | extratags!dict  |
+            | N10001 | boundary | administrative | 'place': 'city' |
         And place contains
-            | object          | class    | type           |
-            | N10002:boundary | boundary | natural        |
-            | N10002:place    | place    | city           |
-            | N10003:boundary | boundary | administrative |
-            | N10003:place    | place    | island         |
+            | object | class    | type           |
+            | N10002 | boundary | natural        |
+            | N10002 | place    | city           |
+            | N10003 | boundary | administrative |
+            | N10003 | place    | island         |
 
 
     Scenario: Building fallbacks
@@ -203,6 +202,88 @@ Feature: Tag evaluation
             n13002 Taddr:interpolation=even,place=city
             """
         Then place contains exactly
-            | object | class | type   | address                 |
+            | object | class | type   | address!dict            |
             | N13001 | place | houses | 'interpolation': 'odd'  |
             | N13002 | place | houses | 'interpolation': 'even' |
+
+
+    Scenario: Footways
+        When loading osm data
+            """
+            n1 x0.0 y0.0
+            n2 x0 y0.0001
+            w1 Thighway=footway Nn1,n2
+            w2 Thighway=footway,name=Road Nn1,n2
+            w3 Thighway=footway,name=Road,footway=sidewalk Nn1,n2
+            w4 Thighway=footway,name=Road,footway=crossing Nn1,n2
+            w5 Thighway=footway,name=Road,footway=residential Nn1,n2
+            """
+        Then place contains exactly
+            | object | name+name |
+            | W2     | Road      |
+            | W5     | Road      |
+
+
+    Scenario: Tourism information
+        When loading osm data
+            """
+            n100 Ttourism=information
+            n101 Ttourism=information,name=Generic
+            n102 Ttourism=information,information=guidepost
+            n103 Thighway=information,information=house
+            n104 Ttourism=information,information=yes,name=Something
+            n105 Ttourism=information,information=route_marker,name=3
+            """
+        Then place contains exactly
+            | object | class       | type        |
+            | N100   | tourism     | information |
+            | N101   | tourism     | information |
+            | N102   | information | guidepost   |
+            | N103   | highway     | information |
+            | N104   | tourism     | information |
+
+
+    Scenario: Water features
+        When loading osm data
+            """
+            n20 Tnatural=water
+            n21 Tnatural=water,name=SomePond
+            n22 Tnatural=water,water=pond
+            n23 Tnatural=water,water=pond,name=Pond
+            n24 Tnatural=water,water=river,name=BigRiver
+            n25 Tnatural=water,water=yes
+            n26 Tnatural=water,water=yes,name=Random
+            """
+        Then place contains exactly
+            | object | class   | type  |
+            | N21    | natural | water |
+            | N23    | water   | pond  |
+            | N26    | natural | water |
+
+    Scenario: Drop name for address fallback
+        When loading osm data
+            """
+            n1 Taddr:housenumber=23,name=Foo
+            n2 Taddr:housenumber=23,addr:housename=Foo
+            n3 Taddr:housenumber=23
+            """
+        Then place contains exactly
+            | object | class    | type  | address!dict        | name!dict               |
+            | N1     | place    | house | 'housenumber': '23' | -                       |
+            | N2     | place    | house | 'housenumber': '23' | 'addr:housename': 'Foo' |
+            | N3     | place    | house | 'housenumber': '23' | -                       |
+
+
+    Scenario: Waterway locks
+        When loading osm data
+            """
+            n1 Twaterway=river,lock=yes
+            n2 Twaterway=river,lock=yes,lock_name=LeLock
+            n3 Twaterway=river,lock=yes,name=LeWater
+            n4 Tamenity=parking,lock=yes,lock_name=Gold
+            """
+        Then place contains exactly
+            | object | class    | type    | name!dict         |
+            | N2     | lock     | yes     | 'name': 'LeLock'  |
+            | N3     | waterway | river   | 'name': 'LeWater' |
+            | N4     | amenity  | parking | -                 |
diff --git a/test/bdd/osm2pgsql/update/interpolations.feature b/test/bdd/features/osm2pgsql/update/interpolations.feature
similarity index 52%
rename from test/bdd/osm2pgsql/update/interpolations.feature
rename to test/bdd/features/osm2pgsql/update/interpolations.feature
index 9ca26285..ca87ed12 100644
--- a/test/bdd/osm2pgsql/update/interpolations.feature
+++ b/test/bdd/features/osm2pgsql/update/interpolations.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Updates of address interpolation objects
     Test that changes to address interpolation objects are correctly
     propagated.
@@ -16,28 +15,28 @@ Feature: Updates of address interpolation objects
             w33 Thighway=residential,name=Tao Nn1,n2
             """
         Then place contains
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
 
         When updating osm data
             """
             w99 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W99:place | houses |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
+            | W99    | place | houses |
         When indexing
         Then placex contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W33:highway | residential |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W33    | highway | residential |
         Then location_property_osmline contains exactly
-            | object |
-            | 99:5   |
+            | osm_id | startnumber |
+            | 99     | 5           |
 
 
     Scenario: Delete an existing interpolation
@@ -48,26 +47,26 @@ Feature: Updates of address interpolation objects
             w99 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W99:place | houses |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
+            | W99    | place | houses |
 
         When updating osm data
             """
             w99 v2 dD
             """
         Then place contains
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
         When indexing
         Then placex contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
         Then location_property_osmline contains exactly
-            | object | indexed_status |
+            | osm_id |
 
 
     Scenario: Changing an object to an interpolation
@@ -79,29 +78,29 @@ Feature: Updates of address interpolation objects
             w99 Thighway=residential Nn1,n2
             """
         Then place contains
-            | object      | type   |
-            | N1:place    | house  |
-            | N2:place    | house  |
-            | W99:highway | residential  |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W99    | highway | residential  |
 
         When updating osm data
             """
             w99 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W99:place | houses |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
+            | W99    | place | houses |
         When indexing
         Then placex contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W33:highway | residential |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W33    | highway | residential |
         And location_property_osmline contains exactly
-            | object |
-            | 99:5   |
+            | osm_id | startnumber |
+            | 99     | 5           |
 
 
     Scenario: Changing an interpolation to something else
@@ -112,26 +111,25 @@ Feature: Updates of address interpolation objects
             w99 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains
-            | object      | type   |
-            | N1:place    | house  |
-            | N2:place    | house  |
-            | W99:place | houses |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
+            | W99    | place | houses |
 
         When updating osm data
             """
             w99 Thighway=residential Nn1,n2
             """
         Then place contains
-            | object      | type   |
-            | N1:place    | house  |
-            | N2:place    | house  |
-            | W99:highway | residential  |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W99    | highway | residential  |
         When indexing
         Then placex contains exactly
-            | object      | type   |
-            | N1:place    | house  |
-            | N2:place    | house  |
-            | W99:highway | residential  |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W99    | highway | residential  |
         And location_property_osmline contains exactly
-            | object |
-
+            | osm_id |
diff --git a/test/bdd/osm2pgsql/update/postcodes.feature b/test/bdd/features/osm2pgsql/update/postcodes.feature
similarity index 64%
rename from test/bdd/osm2pgsql/update/postcodes.feature
rename to test/bdd/features/osm2pgsql/update/postcodes.feature
index 6bd61af7..607eeccb 100644
--- a/test/bdd/osm2pgsql/update/postcodes.feature
+++ b/test/bdd/features/osm2pgsql/update/postcodes.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update of postcode only objects
     Tests that changes to objects containing only a postcode are
     propagated correctly.
@@ -7,6 +6,7 @@ Feature: Update of postcode only objects
     Scenario: Adding a postcode-only node
         When loading osm data
             """
+            n1
             """
         Then place contains exactly
             | object |
@@ -16,8 +16,8 @@ Feature: Update of postcode only objects
             n34 Tpostcode=4456
             """
         Then place contains exactly
-            | object    | type     |
-            | N34:place | postcode |
+            | object | class | type     |
+            | N34    | place | postcode |
         When indexing
         Then placex contains exactly
             | object |
@@ -29,8 +29,8 @@ Feature: Update of postcode only objects
             n34 Tpostcode=4456
             """
         Then place contains exactly
-            | object    | type     |
-            | N34:place | postcode |
+            | object | class | type     |
+            | N34    | place | postcode |
 
         When updating osm data
             """
@@ -49,16 +49,16 @@ Feature: Update of postcode only objects
             n34 T<class>=<type>
             """
         Then place contains exactly
-            | object      | type   |
-            | N34:<class> | <type> |
+            | object | class   | type   |
+            | N34    | <class> | <type> |
 
         When updating osm data
             """
             n34 Tpostcode=4456
             """
         Then place contains exactly
-            | object    | type     |
-            | N34:place | postcode |
+            | object | class | type     |
+            | N34    | place | postcode |
         When indexing
         Then placex contains exactly
             | object |
@@ -75,20 +75,20 @@ Feature: Update of postcode only objects
             n34 Tpostcode=4456
             """
         Then place contains exactly
-            | object    | type     |
-            | N34:place | postcode |
+            | object | class | type     |
+            | N34    | place | postcode |
 
         When updating osm data
             """
             n34 T<class>=<type>
             """
         Then place contains exactly
-            | object      | type   |
-            | N34:<class> | <type> |
+            | object | class   | type   |
+            | N34    | <class> | <type> |
         When indexing
         Then placex contains exactly
-            | object      | type   |
-            | N34:<class> | <type> |
+            | object | class   | type   |
+            | N34    | <class> | <type> |
 
         Examples:
             | class   | type       |
@@ -106,27 +106,27 @@ Feature: Update of postcode only objects
             w34 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W34:place | houses |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
+            | W34    | place | houses |
 
         When updating osm data
             """
             w34 Tpostcode=4456 Nn1,n2
             """
         Then place contains exactly
-            | object    | type     |
-            | N1:place  | house    |
-            | N2:place  | house    |
-            | W34:place | postcode |
+            | object | class | type     |
+            | N1     | place | house    |
+            | N2     | place | house    |
+            | W34    | place | postcode |
         When indexing
         Then location_property_osmline contains exactly
-            | object |
+            | osm_id |
         And placex contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
+            | object | class | type   |
+            | N1     | place | house  |
+            | N2     | place | house  |
 
 
     Scenario: Converting a postcode-only node into an interpolation
@@ -140,28 +140,28 @@ Feature: Update of postcode only objects
             w34 Tpostcode=4456 Nn1,n2
             """
         Then place contains exactly
-            | object    | type     |
-            | N1:place  | house    |
-            | N2:place  | house    |
-            | W33:highway | residential |
-            | W34:place | postcode |
+            | object | class   | type     |
+            | N1     | place   | house    |
+            | N2     | place   | house    |
+            | W33    | highway | residential |
+            | W34    | place   | postcode |
 
         When updating osm data
             """
             w34 Taddr:interpolation=odd Nn1,n2
             """
         Then place contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W33:highway | residential |
-            | W34:place | houses |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W33    | highway | residential |
+            | W34    | place   | houses |
         When indexing
         Then location_property_osmline contains exactly
-            | object |
-            | 34:5   |
+            | osm_id | startnumber | endnumber |
+            | 34     | 5           | 15        |
         And placex contains exactly
-            | object    | type   |
-            | N1:place  | house  |
-            | N2:place  | house  |
-            | W33:highway | residential |
+            | object | class   | type   |
+            | N1     | place   | house  |
+            | N2     | place   | house  |
+            | W33    | highway | residential |
diff --git a/test/bdd/osm2pgsql/update/relation.feature b/test/bdd/features/osm2pgsql/update/relation.feature
similarity index 88%
rename from test/bdd/osm2pgsql/update/relation.feature
rename to test/bdd/features/osm2pgsql/update/relation.feature
index 794ef5c5..302231b4 100644
--- a/test/bdd/osm2pgsql/update/relation.feature
+++ b/test/bdd/features/osm2pgsql/update/relation.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Update of relations by osm2pgsql
     Testing relation update by osm2pgsql.
 
@@ -14,7 +13,7 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XZ Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XZ' |
           When updating osm data
             """
@@ -34,7 +33,7 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XZ Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XZ' |
         When updating osm data
           """
@@ -42,7 +41,7 @@ Feature: Update of relations by osm2pgsql
           """
         Then place has no entry for R1:tourism
         And place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | amenity | prison | 'name' : 'XZ' |
 
     Scenario: Change name of a relation
@@ -56,14 +55,14 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=AB Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'AB' |
         When updating osm data
           """
           r1 Ttype=multipolygon,tourism=hotel,name=XY Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XY' |
 
     Scenario: Change type of a relation into something unknown
@@ -77,7 +76,7 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XY Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XY' |
         When updating osm data
           """
@@ -96,7 +95,7 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XY Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XY' |
         When updating osm data
           """
@@ -115,7 +114,7 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=multipolygon,tourism=hotel,name=XY Mw2@
           """
         Then place contains
-          | object | class   | type   | name |
+          | object | class   | type   | name!dict |
           | R1     | tourism | hotel  | 'name' : 'XY' |
         When updating osm data
           """
@@ -137,5 +136,5 @@ Feature: Update of relations by osm2pgsql
           r1 Ttype=boundary,boundary=administrative,name=Foo,country_code=XX,admin_level=2 Mw1@
           """
         Then place contains
-          | object | addr+country | name           |
-          | R1     | XX           | 'name' : 'Foo' |
+          | object | address+country | name!dict      |
+          | R1     | XX              | 'name' : 'Foo' |
diff --git a/test/bdd/features/osm2pgsql/update/simple.feature b/test/bdd/features/osm2pgsql/update/simple.feature
new file mode 100644
index 00000000..cc26f8bd
--- /dev/null
+++ b/test/bdd/features/osm2pgsql/update/simple.feature
@@ -0,0 +1,48 @@
+Feature: Update of simple objects by osm2pgsql
+    Testing basic update functions of osm2pgsql.
+
+    Scenario: Adding a new object
+        When loading osm data
+          """
+          n1 Tplace=town,name=Middletown
+          """
+        Then place contains exactly
+          | object | class | type | name+name  |
+          | N1     | place | town | Middletown |
+
+        When updating osm data
+          """
+          n2 Tamenity=hotel,name=Posthotel
+          """
+        Then place contains exactly
+          | object | class   | type  | name+name  |
+          | N1     | place   | town  | Middletown |
+          | N2     | amenity | hotel | Posthotel  |
+        And placex contains exactly
+          | object | class   | type  | name+name  | indexed_status |
+          | N1     | place   | town  | Middletown | 0              |
+          | N2     | amenity | hotel | Posthotel  | 1              |
+
+
+    Scenario: Deleting an existing object
+        When loading osm data
+          """
+          n1 Tplace=town,name=Middletown
+          n2 Tamenity=hotel,name=Posthotel
+          """
+        Then place contains exactly
+          | object | class   | type  | name+name  |
+          | N1     | place   | town  | Middletown |
+          | N2     | amenity | hotel | Posthotel  |
+
+        When updating osm data
+          """
+          n2 dD
+          """
+        Then place contains exactly
+          | object | class | type  | name+name  |
+          | N1     | place | town  | Middletown |
+        And placex contains exactly
+          | object | class   | type  | name+name  | indexed_status |
+          | N1     | place   | town  | Middletown | 0              |
+          | N2     | amenity | hotel | Posthotel  | 100            |
diff --git a/test/bdd/osm2pgsql/update/tags.feature b/test/bdd/features/osm2pgsql/update/tags.feature
similarity index 69%
rename from test/bdd/osm2pgsql/update/tags.feature
rename to test/bdd/features/osm2pgsql/update/tags.feature
index e2fd665a..371a5089 100644
--- a/test/bdd/osm2pgsql/update/tags.feature
+++ b/test/bdd/features/osm2pgsql/update/tags.feature
@@ -1,4 +1,3 @@
-@DB
 Feature: Tag evaluation
     Tests if tags are correctly updated in the place table
 
@@ -16,11 +15,11 @@ Feature: Tag evaluation
             n3 Tamenity=prison
             """
         Then place contains exactly
-            | object     | class   | type       |
-            | N1         | amenity | restaurant |
-            | N2:highway | highway | bus_stop   |
-            | N2:railway | railway | stop       |
-            | N3         | amenity | prison     |
+            | object | class   | type       |
+            | N1     | amenity | restaurant |
+            | N2     | highway | bus_stop   |
+            | N2     | railway | stop       |
+            | N3     | amenity | prison     |
 
         When updating osm data
             """
@@ -28,17 +27,17 @@ Feature: Tag evaluation
             n2 Thighway=bus_stop,name=X
             """
         Then place contains exactly
-            | object     | class   | type       |
-            | N2:highway | highway | bus_stop   |
-            | N3         | amenity | prison     |
+            | object | class   | type       |
+            | N2     | highway | bus_stop   |
+            | N3     | amenity | prison     |
         And placex contains
-            | object     | indexed_status |
-            | N3:amenity | 0              |
+            | object | class   | indexed_status |
+            | N3     | amenity | 0              |
         When indexing
         Then placex contains exactly
-            | object     | type     | name        |
-            | N2:highway | bus_stop | 'name': 'X' |
-            | N3:amenity | prison   | -           |
+            | object | class   | type     | name!dict   |
+            | N2     | highway | bus_stop | 'name': 'X' |
+            | N3     | amenity | prison   | -           |
 
 
     Scenario: Main tag added
@@ -48,8 +47,8 @@ Feature: Tag evaluation
             n2 Thighway=bus_stop,name=X
             """
         Then place contains exactly
-            | object     | class   | type       |
-            | N2:highway | highway | bus_stop   |
+            | object | class   | type       |
+            | N2     | highway | bus_stop   |
 
         When updating osm data
             """
@@ -57,16 +56,16 @@ Feature: Tag evaluation
             n2 Thighway=bus_stop,railway=stop,name=X
             """
         Then place contains exactly
-            | object     | class   | type       |
-            | N1         | amenity | restaurant |
-            | N2:highway | highway | bus_stop   |
-            | N2:railway | railway | stop       |
+            | object | class   | type       |
+            | N1     | amenity | restaurant |
+            | N2     | highway | bus_stop   |
+            | N2     | railway | stop       |
         When indexing
         Then placex contains exactly
-            | object     | type       | name        |
-            | N1:amenity | restaurant | -           |
-            | N2:highway | bus_stop   | 'name': 'X' |
-            | N2:railway | stop       | 'name': 'X' |
+            | object | class   | type       | name!dict   |
+            | N1     | amenity | restaurant | -           |
+            | N2     | highway | bus_stop   | 'name': 'X' |
+            | N2     | railway | stop       | 'name': 'X' |
 
 
     Scenario: Main tag modified
@@ -91,9 +90,9 @@ Feature: Tag evaluation
             | N11    | highway | primary |
         When indexing
         Then placex contains exactly
-            | object      | type       | name        |
-            | N10:highway | path       | 'name': 'X' |
-            | N11:highway | primary    | -           |
+            | object | class   | type       | name!dict   |
+            | N10    | highway | path       | 'name': 'X' |
+            | N11    | highway | primary    | -           |
 
 
     Scenario: Main tags with name, name added
@@ -116,9 +115,9 @@ Feature: Tag evaluation
             | N46    | building| yes     |
         When indexing
         Then placex contains exactly
-            | object      | type       | name           | address            |
-            | N45:landuse | cemetry    | 'name': 'TODO' | -                  |
-            | N46:building| yes        | -              | 'housenumber': '1' |
+            | object | class   | type       | name!dict      | address!dict       |
+            | N45    | landuse | cemetry    | 'name': 'TODO' | -                  |
+            | N46    | building| yes        | -              | 'housenumber': '1' |
 
 
     Scenario: Main tags with name, name removed
@@ -150,7 +149,7 @@ Feature: Tag evaluation
             n46 Tbuilding=yes,addr:housenumber=1
             """
         Then place contains exactly
-            | object | class   | type    | name            | address           |
+            | object | class   | type    | name!dict       | address!dict      |
             | N45    | landuse | cemetry | 'name' : 'TODO' | -                 |
             | N46    | building| yes     | -               | 'housenumber': '1'|
 
@@ -160,12 +159,12 @@ Feature: Tag evaluation
             n46 Tbuilding=yes,addr:housenumber=10
             """
         Then place contains exactly
-            | object | class   | type    | name            | address            |
+            | object | class   | type    | name!dict       | address!dict       |
             | N45    | landuse | cemetry | 'name' : 'DONE' | -                  |
             | N46    | building| yes     | -               | 'housenumber': '10'|
         When indexing
         Then placex contains exactly
-            | object | class   | type    | name            | address            |
+            | object | class   | type    | name!dict       | address!dict       |
             | N45    | landuse | cemetry | 'name' : 'DONE' | -                  |
             | N46    | building| yes     | -               | 'housenumber': '10'|
 
@@ -176,7 +175,7 @@ Feature: Tag evaluation
             n1 Taddr:housenumber=345
             """
         Then place contains exactly
-            | object | class | type  | address |
+            | object | class | type  | address!dict |
             | N1     | place | house | 'housenumber': '345'|
 
         When updating osm data
@@ -184,11 +183,11 @@ Feature: Tag evaluation
             n1 Taddr:housenumber=345,building=yes
             """
         Then place contains exactly
-            | object | class    | type  | address |
+            | object | class    | type  | address!dict |
             | N1     | building | yes   | 'housenumber': '345'|
         When indexing
         Then placex contains exactly
-            | object | class    | type  | address |
+            | object | class    | type  | address!dict |
             | N1     | building | yes   | 'housenumber': '345'|
 
 
@@ -198,7 +197,7 @@ Feature: Tag evaluation
             n1 Taddr:housenumber=345,building=yes
             """
         Then place contains exactly
-            | object | class    | type  | address |
+            | object | class    | type  | address!dict |
             | N1     | building | yes   | 'housenumber': '345'|
 
         When updating osm data
@@ -206,11 +205,11 @@ Feature: Tag evaluation
             n1 Taddr:housenumber=345
             """
         Then place contains exactly
-            | object | class | type  | address |
+            | object | class | type  | address!dict |
             | N1     | place | house | 'housenumber': '345'|
         When indexing
         Then placex contains exactly
-            | object | class | type  | address |
+            | object | class | type  | address!dict |
             | N1     | place | house | 'housenumber': '345'|
 
 
@@ -227,11 +226,11 @@ Feature: Tag evaluation
             n2 Tbridge=yes,bridge:name=high
             """
         Then place contains exactly
-            | object | class    | type  | name           |
+            | object | class    | type  | name!dict      |
             | N2     | bridge   | yes   | 'name': 'high' |
         When indexing
         Then placex contains exactly
-            | object | class    | type  | name           |
+            | object | class    | type  | name!dict      |
             | N2     | bridge   | yes   | 'name': 'high' |
 
 
@@ -241,7 +240,7 @@ Feature: Tag evaluation
             n2 Tbridge=yes,bridge:name=high
             """
         Then place contains exactly
-            | object | class    | type  | name           |
+            | object | class    | type  | name!dict      |
             | N2     | bridge   | yes   | 'name': 'high' |
 
         When updating osm data
@@ -261,7 +260,7 @@ Feature: Tag evaluation
             n2 Tbridge=yes,bridge:name=high
             """
         Then place contains exactly
-            | object | class    | type  | name           |
+            | object | class    | type  | name!dict      |
             | N2     | bridge   | yes   | 'name': 'high' |
 
         When updating osm data
@@ -269,11 +268,11 @@ Feature: Tag evaluation
             n2 Tbridge=yes,bridge:name:en=high
             """
         Then place contains exactly
-            | object | class  | type | name              |
+            | object | class  | type | name!dict         |
             | N2     | bridge | yes  | 'name:en': 'high' |
         When indexing
         Then placex contains exactly
-            | object | class  | type | name              |
+            | object | class  | type | name!dict         |
             | N2     | bridge | yes  | 'name:en': 'high' |
 
 
@@ -285,8 +284,8 @@ Feature: Tag evaluation
           w1 Thighway=residential Nn100,n101
           """
         Then place contains exactly
-          | object     |
-          | W1:highway |
+          | object | class |
+          | W1     | highway |
 
         When updating osm data
           """
@@ -314,12 +313,12 @@ Feature: Tag evaluation
           w1 Thighway=unclassified Nn100,n101
           """
         Then place contains exactly
-          | object     |
-          | W1:highway |
+          | object | class   |
+          | W1     | highway |
         When indexing
         Then placex contains exactly
-          | object     |
-          | W1:highway |
+          | object | class   |
+          | W1     | highway |
 
 
     Scenario: Downgrading a highway when a second tag is present
@@ -330,21 +329,21 @@ Feature: Tag evaluation
           w1 Thighway=residential,tourism=hotel Nn100,n101
           """
         Then place contains exactly
-          | object     | type        |
-          | W1:highway | residential |
-          | W1:tourism | hotel       |
+          | object | class   | type        |
+          | W1     | highway | residential |
+          | W1     | tourism | hotel       |
 
         When updating osm data
           """
           w1 Thighway=service,tourism=hotel Nn100,n101
           """
         Then place contains exactly
-          | object     | type  |
-          | W1:tourism | hotel |
+          | object | class   | type  |
+          | W1     | tourism | hotel |
         When indexing
         Then placex contains exactly
-          | object     | type  |
-          | W1:tourism | hotel |
+          | object | class   | type  |
+          | W1     | tourism | hotel |
 
 
     Scenario: Upgrading a highway when a second tag is present
@@ -355,22 +354,22 @@ Feature: Tag evaluation
           w1 Thighway=service,tourism=hotel Nn100,n101
           """
         Then place contains exactly
-          | object     | type  |
-          | W1:tourism | hotel |
+          | object | class   | type  |
+          | W1     | tourism | hotel |
 
         When updating osm data
           """
           w1 Thighway=residential,tourism=hotel Nn100,n101
           """
         Then place contains exactly
-          | object     | type        |
-          | W1:highway | residential |
-          | W1:tourism | hotel       |
+          | object | class   | type        |
+          | W1     | highway | residential |
+          | W1     | tourism | hotel       |
         When indexing
         Then placex contains exactly
-          | object     | type        |
-          | W1:highway | residential |
-          | W1:tourism | hotel       |
+          | object | class   | type        |
+          | W1     | highway | residential |
+          | W1     | tourism | hotel       |
 
 
     Scenario: Replay on administrative boundary
@@ -382,22 +381,22 @@ Feature: Tag evaluation
           w10 Tboundary=administrative,waterway=river,name=Border,admin_level=2 Nn12,n11,n10
           """
         Then place contains exactly
-          | object       | type           | admin_level | name             |
-          | W10:waterway | river          | 2           | 'name': 'Border' |
-          | W10:boundary | administrative | 2           | 'name': 'Border' |
+          | object | class    | type           | admin_level | name!dict        |
+          | W10    | waterway | river          | 2           | 'name': 'Border' |
+          | W10    | boundary | administrative | 2           | 'name': 'Border' |
 
         When updating osm data
           """
           w10 Tboundary=administrative,waterway=river,name=Border,admin_level=2 Nn12,n11,n10
           """
         Then place contains exactly
-          | object       | type           | admin_level | name             |
-          | W10:waterway | river          | 2           | 'name': 'Border' |
-          | W10:boundary | administrative | 2           | 'name': 'Border' |
+          | object | class    | type           | admin_level | name!dict        |
+          | W10    | waterway | river          | 2           | 'name': 'Border' |
+          | W10    | boundary | administrative | 2           | 'name': 'Border' |
         When indexing
         Then placex contains exactly
-          | object       | type           | admin_level | name             |
-          | W10:waterway | river          | 2           | 'name': 'Border' |
+          | object | class    | type           | admin_level | name!dict        |
+          | W10    | waterway | river          | 2           | 'name': 'Border' |
 
 
     Scenario: Change admin_level on administrative boundary
@@ -414,20 +413,20 @@ Feature: Tag evaluation
           r10 Ttype=multipolygon,boundary=administrative,name=Border,admin_level=2 Mw10@
           """
         Then place contains exactly
-          | object       | admin_level |
-          | R10:boundary | 2           |
+          | object | class    | admin_level |
+          | R10    | boundary | 2           |
 
         When updating osm data
           """
           r10 Ttype=multipolygon,boundary=administrative,name=Border,admin_level=4 Mw10@
           """
         Then place contains exactly
-          | object       | type           | admin_level |
-          | R10:boundary | administrative | 4           |
+          | object | class    | type           | admin_level |
+          | R10    | boundary | administrative | 4           |
         When indexing
         Then placex contains exactly
-          | object       | type           | admin_level |
-          | R10:boundary | administrative | 4           |
+          | object | class    | type           | admin_level |
+          | R10    | boundary | administrative | 4           |
 
 
     Scenario: Change boundary to administrative
@@ -444,20 +443,20 @@ Feature: Tag evaluation
           r10 Ttype=multipolygon,boundary=informal,name=Border,admin_level=4 Mw10@
           """
         Then place contains exactly
-          | object       | type     | admin_level |
-          | R10:boundary | informal | 4           |
+          | object | class    | type     | admin_level |
+          | R10    | boundary | informal | 4           |
 
         When updating osm data
           """
           r10 Ttype=multipolygon,boundary=administrative,name=Border,admin_level=4 Mw10@
           """
         Then place contains exactly
-          | object       | type           | admin_level |
-          | R10:boundary | administrative | 4           |
+          | object | class    | type           | admin_level |
+          | R10    | boundary | administrative | 4           |
         When indexing
         Then placex contains exactly
-          | object       | type           | admin_level |
-          | R10:boundary | administrative | 4           |
+          | object | class    | type           | admin_level |
+          | R10    | boundary | administrative | 4           |
 
 
     Scenario: Change boundary away from administrative
@@ -474,20 +473,20 @@ Feature: Tag evaluation
           r10 Ttype=multipolygon,boundary=administrative,name=Border,admin_level=4 Mw10@
           """
         Then place contains exactly
-          | object       | type           | admin_level |
-          | R10:boundary | administrative | 4           |
+          | object | class    | type           | admin_level |
+          | R10    | boundary | administrative | 4           |
 
         When updating osm data
           """
           r10 Ttype=multipolygon,boundary=informal,name=Border,admin_level=4 Mw10@
           """
         Then place contains exactly
-          | object       | type     | admin_level |
-          | R10:boundary | informal | 4           |
+          | object | class    | type     | admin_level |
+          | R10    | boundary | informal | 4           |
         When indexing
         Then placex contains exactly
-          | object       | type     | admin_level |
-          | R10:boundary | informal | 4           |
+          | object | class    | type     | admin_level |
+          | R10    | boundary | informal | 4           |
 
 
     Scenario: Main tag and geometry is changed
@@ -500,8 +499,8 @@ Feature: Tag evaluation
           w5 Tbuilding=house,name=Foo Nn1,n2,n3,n4,n1
           """
         Then place contains exactly
-          | object      | type  |
-          | W5:building | house |
+          | object | class    | type  |
+          | W5     | building | house |
 
         When updating osm data
           """
@@ -509,5 +508,5 @@ Feature: Tag evaluation
           w5 Tbuilding=terrace,name=Bar Nn1,n2,n3,n4,n1
           """
         Then place contains exactly
-          | object      | type    |
-          | W5:building | terrace |
+          | object | class    | type    |
+          | W5     | building | terrace |
diff --git a/test/bdd/osm2pgsql/update/simple.feature b/test/bdd/osm2pgsql/update/simple.feature
deleted file mode 100644
index 5a86917c..00000000
--- a/test/bdd/osm2pgsql/update/simple.feature
+++ /dev/null
@@ -1,49 +0,0 @@
-@DB
-Feature: Update of simple objects by osm2pgsql
-    Testing basic update functions of osm2pgsql.
-
-    Scenario: Adding a new object
-        When loading osm data
-          """
-          n1 Tplace=town,name=Middletown
-          """
-        Then place contains exactly
-          | object   | type | name+name  |
-          | N1:place | town | Middletown |
-
-       When updating osm data
-         """
-         n2 Tamenity=hotel,name=Posthotel
-         """
-        Then place contains exactly
-          | object     | type  | name+name  |
-          | N1:place   | town  | Middletown |
-          | N2:amenity | hotel | Posthotel  |
-        And placex contains exactly
-          | object     | type  | name+name  | indexed_status |
-          | N1:place   | town  | Middletown | 0              |
-          | N2:amenity | hotel | Posthotel  | 1              |
-
-
-    Scenario: Deleting an existing object
-        When loading osm data
-          """
-          n1 Tplace=town,name=Middletown
-          n2 Tamenity=hotel,name=Posthotel
-          """
-        Then place contains exactly
-          | object     | type  | name+name  |
-          | N1:place   | town  | Middletown |
-          | N2:amenity | hotel | Posthotel  |
-
-       When updating osm data
-         """
-         n2 dD
-         """
-        Then place contains exactly
-          | object     | type  | name+name  |
-          | N1:place   | town  | Middletown |
-        And placex contains exactly
-          | object     | type  | name+name  | indexed_status |
-          | N1:place   | town  | Middletown | 0              |
-          | N2:amenity | hotel | Posthotel  | 100            |
diff --git a/test/bdd/steps/check_functions.py b/test/bdd/steps/check_functions.py
deleted file mode 100644
index 49676896..00000000
--- a/test/bdd/steps/check_functions.py
+++ /dev/null
@@ -1,113 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2023 by the Nominatim developer community.
-# For a full list of authors see the git log.
-"""
-Collection of assertion functions used for the steps.
-"""
-import json
-import math
-import re
-
-class Almost:
-    """ Compares a float value with a certain jitter.
-    """
-    def __init__(self, value, offset=0.00001):
-        self.value = value
-        self.offset = offset
-
-    def __eq__(self, other):
-        return abs(other - self.value) < self.offset
-
-
-OSM_TYPE = {'N' : 'node', 'W' : 'way', 'R' : 'relation',
-            'n' : 'node', 'w' : 'way', 'r' : 'relation',
-            'node' : 'n', 'way' : 'w', 'relation' : 'r'}
-
-
-class OsmType:
-    """ Compares an OSM type, accepting both N/R/W and node/way/relation.
-    """
-
-    def __init__(self, value):
-        self.value = value
-
-
-    def __eq__(self, other):
-        return other == self.value or other == OSM_TYPE[self.value]
-
-
-    def __str__(self):
-        return f"{self.value} or {OSM_TYPE[self.value]}"
-
-
-class Field:
-    """ Generic comparator for fields, which looks at the type of the
-        value compared.
-    """
-    def __init__(self, value, **extra_args):
-        self.value = value
-        self.extra_args = extra_args
-
-    def __eq__(self, other):
-        if isinstance(self.value, float):
-            return math.isclose(self.value, float(other), **self.extra_args)
-
-        if self.value.startswith('^'):
-            return re.fullmatch(self.value, str(other))
-
-        if isinstance(other, dict):
-            return other == eval('{' + self.value + '}')
-
-        return str(self.value) == str(other)
-
-    def __str__(self):
-        return str(self.value)
-
-
-class Bbox:
-    """ Comparator for bounding boxes.
-    """
-    def __init__(self, bbox_string):
-        self.coord = [float(x) for x in bbox_string.split(',')]
-
-    def __contains__(self, item):
-        if isinstance(item, str):
-            item = item.split(',')
-        item = list(map(float, item))
-
-        if len(item) == 2:
-            return self.coord[0] <= item[0] <= self.coord[2] \
-                   and self.coord[1] <= item[1] <= self.coord[3]
-
-        if len(item) == 4:
-            return item[0] >= self.coord[0] and item[1] <= self.coord[1] \
-                   and item[2] >= self.coord[2] and item[3] <= self.coord[3]
-
-        raise ValueError("Not a coordinate or bbox.")
-
-    def __str__(self):
-        return str(self.coord)
-
-
-
-def check_for_attributes(obj, attrs, presence='present'):
-    """ Check that the object has the given attributes. 'attrs' is a
-        string with a comma-separated list of attributes. If 'presence'
-        is set to 'absent' then the function checks that the attributes do
-        not exist for the object
-    """
-    def _dump_json():
-        return json.dumps(obj, sort_keys=True, indent=2, ensure_ascii=False)
-
-    for attr in attrs.split(','):
-        attr = attr.strip()
-        if presence == 'absent':
-            assert attr not in obj, \
-                   f"Unexpected attribute {attr}. Full response:\n{_dump_json()}"
-        else:
-            assert attr in obj, \
-                   f"No attribute '{attr}'. Full response:\n{_dump_json()}"
-
diff --git a/test/bdd/steps/geometry_alias.py b/test/bdd/steps/geometry_alias.py
deleted file mode 100644
index a9b4ec8c..00000000
--- a/test/bdd/steps/geometry_alias.py
+++ /dev/null
@@ -1,262 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2022 by the Nominatim developer community.
-# For a full list of authors see the git log.
-"""
-Collection of aliases for various world coordinates.
-"""
-
-ALIASES = {
-# Country aliases
-'AD': (1.58972, 42.54241),
-'AE': (54.61589, 24.82431),
-'AF': (65.90264, 34.84708),
-'AG': (-61.72430, 17.069),
-'AI': (-63.10571, 18.25461),
-'AL': (19.84941, 40.21232),
-'AM': (44.64229, 40.37821),
-'AO': (16.21924, -12.77014),
-'AQ': (44.99999, -75.65695),
-'AR': (-61.10759, -34.37615),
-'AS': (-170.68470, -14.29307),
-'AT': (14.25747, 47.36542),
-'AU': (138.23155, -23.72068),
-'AW': (-69.98255, 12.555),
-'AX': (19.91839, 59.81682),
-'AZ': (48.38555, 40.61639),
-'BA': (17.18514, 44.25582),
-'BB': (-59.53342, 13.19),
-'BD': (89.75989, 24.34205),
-'BE': (4.90078, 50.34682),
-'BF': (-0.56743, 11.90471),
-'BG': (24.80616, 43.09859),
-'BH': (50.52032, 25.94685),
-'BI': (29.54561, -2.99057),
-'BJ': (2.70062, 10.02792),
-'BL': (-62.79349, 17.907),
-'BM': (-64.77406, 32.30199),
-'BN': (114.52196, 4.28638),
-'BO': (-62.02473, -17.77723),
-'BQ': (-63.14322, 17.566),
-'BR': (-45.77065, -9.58685),
-'BS': (-77.60916, 23.8745),
-'BT': (90.01350, 27.28137),
-'BV': (3.35744, -54.4215),
-'BW': (23.51505, -23.48391),
-'BY': (26.77259, 53.15885),
-'BZ': (-88.63489, 16.33951),
-'CA': (-107.74817, 67.12612),
-'CC': (96.84420, -12.01734),
-'CD': (24.09544, -1.67713),
-'CF': (22.58701, 5.98438),
-'CG': (15.78875, 0.40388),
-'CH': (7.65705, 46.57446),
-'CI': (-6.31190, 6.62783),
-'CK': (-159.77835, -21.23349),
-'CL': (-70.41790, -53.77189),
-'CM': (13.26022, 5.94519),
-'CN': (96.44285, 38.04260),
-'CO': (-72.52951, 2.45174),
-'CR': (-83.83314, 9.93514),
-'CU': (-80.81673, 21.88852),
-'CV': (-24.50810, 14.929),
-'CW': (-68.96409, 12.1845),
-'CX': (105.62411, -10.48417),
-'CY': (32.95922, 35.37010),
-'CZ': (16.32098, 49.50692),
-'DE': (9.30716, 50.21289),
-'DJ': (42.96904, 11.41542),
-'DK': (9.18490, 55.98916),
-'DM': (-61.00358, 15.65470),
-'DO': (-69.62855, 18.58841),
-'DZ': (4.24749, 25.79721),
-'EC': (-77.45831, -0.98284),
-'EE': (23.94288, 58.43952),
-'EG': (28.95293, 28.17718),
-'EH': (-13.69031, 25.01241),
-'ER': (39.01223, 14.96033),
-'ES': (-2.59110, 38.79354),
-'ET': (38.61697, 7.71399),
-'FI': (26.89798, 63.56194),
-'FJ': (177.91853, -17.74237),
-'FK': (-58.99044, -51.34509),
-'FM': (151.95358, 8.5045),
-'FO': (-6.60483, 62.10000),
-'FR': (0.28410, 47.51045),
-'GA': (10.81070, -0.07429),
-'GB': (-0.92823, 52.01618),
-'GD': (-61.64524, 12.191),
-'GE': (44.16664, 42.00385),
-'GF': (-53.46524, 3.56188),
-'GG': (-2.50580, 49.58543),
-'GH': (-0.46348, 7.16051),
-'GI': (-5.32053, 36.11066),
-'GL': (-33.85511, 74.66355),
-'GM': (-16.40960, 13.25),
-'GN': (-13.83940, 10.96291),
-'GP': (-61.68712, 16.23049),
-'GQ': (10.23973, 1.43119),
-'GR': (23.17850, 39.06206),
-'GS': (-36.49430, -54.43067),
-'GT': (-90.74368, 15.20428),
-'GU': (144.73362, 13.44413),
-'GW': (-14.83525, 11.92486),
-'GY': (-58.45167, 5.73698),
-'HK': (114.18577, 22.34923),
-'HM': (73.68230, -53.22105),
-'HN': (-86.95414, 15.23820),
-'HR': (17.49966, 45.52689),
-'HT': (-73.51925, 18.32492),
-'HU': (20.35362, 47.51721),
-'ID': (123.34505, -0.83791),
-'IE': (-9.00520, 52.87725),
-'IL': (35.46314, 32.86165),
-'IM': (-4.86740, 54.023),
-'IN': (88.67620, 27.86155),
-'IO': (71.42743, -6.14349),
-'IQ': (42.58109, 34.26103),
-'IR': (56.09355, 30.46751),
-'IS': (-17.51785, 64.71687),
-'IT': (10.42639, 44.87904),
-'JE': (-2.19261, 49.12458),
-'JM': (-76.84020, 18.3935),
-'JO': (36.55552, 30.75741),
-'JP': (138.72531, 35.92099),
-'KE': (36.90602, 1.08512),
-'KG': (76.15571, 41.66497),
-'KH': (104.31901, 12.95555),
-'KI': (173.63353, 0.139),
-'KM': (44.31474, -12.241),
-'KN': (-62.69379, 17.2555),
-'KP': (126.65575, 39.64575),
-'KR': (127.27740, 36.41388),
-'KW': (47.30684, 29.69180),
-'KY': (-81.07455, 19.29949),
-'KZ': (72.00811, 49.88855),
-'LA': (102.44391, 19.81609),
-'LB': (35.48464, 33.41766),
-'LC': (-60.97894, 13.891),
-'LI': (9.54693, 47.15934),
-'LK': (80.38520, 8.41649),
-'LR': (-11.16960, 4.04122),
-'LS': (28.66984, -29.94538),
-'LT': (24.51735, 55.49293),
-'LU': (6.08649, 49.81533),
-'LV': (23.51033, 56.67144),
-'LY': (15.36841, 28.12177),
-'MA': (-4.03061, 33.21696),
-'MC': (7.47743, 43.62917),
-'MD': (29.61725, 46.66517),
-'ME': (19.72291, 43.02441),
-'MF': (-63.06666, 18.08102),
-'MG': (45.86378, -20.50245),
-'MH': (171.94982, 5.983),
-'MK': (21.42108, 41.08980),
-'ML': (-1.93310, 16.46993),
-'MM': (95.54624, 21.09620),
-'MN': (99.81138, 48.18615),
-'MO': (113.56441, 22.16209),
-'MP': (145.21345, 14.14902),
-'MQ': (-60.81128, 14.43706),
-'MR': (-9.42324, 22.59251),
-'MS': (-62.19455, 16.745),
-'MT': (14.38363, 35.94467),
-'MU': (57.55121, -20.41),
-'MV': (73.39292, 4.19375),
-'MW': (33.95722, -12.28218),
-'MX': (-105.89221, 25.86826),
-'MY': (112.71154, 2.10098),
-'MZ': (37.58689, -13.72682),
-'NA': (16.68569, -21.46572),
-'NC': (164.95322, -20.38889),
-'NE': (10.06041, 19.08273),
-'NF': (167.95718, -29.0645),
-'NG': (10.17781, 10.17804),
-'NI': (-85.87974, 13.21715),
-'NL': (-68.57062, 12.041),
-'NO': (23.11556, 70.09934),
-'NP': (83.36259, 28.13107),
-'NR': (166.93479, -0.5275),
-'NU': (-169.84873, -19.05305),
-'NZ': (167.97209, -45.13056),
-'OM': (56.86055, 20.47413),
-'PA': (-79.40160, 8.80656),
-'PE': (-78.66540, -7.54711),
-'PF': (-145.05719, -16.70862),
-'PG': (146.64600, -7.37427),
-'PH': (121.48359, 15.09965),
-'PK': (72.11347, 31.14629),
-'PL': (17.88136, 52.77182),
-'PM': (-56.19515, 46.78324),
-'PN': (-130.10642, -25.06955),
-'PR': (-65.88755, 18.37169),
-'PS': (35.39801, 32.24773),
-'PT': (-8.45743, 40.11154),
-'PW': (134.49645, 7.3245),
-'PY': (-59.51787, -22.41281),
-'QA': (51.49903, 24.99816),
-'RE': (55.77345, -21.36388),
-'RO': (26.37632, 45.36120),
-'RS': (20.40371, 44.56413),
-'RU': (116.44060, 59.06780),
-'RW': (29.57882, -1.62404),
-'SA': (47.73169, 22.43790),
-'SB': (164.63894, -10.23606),
-'SC': (46.36566, -9.454),
-'SD': (28.14720, 14.56423),
-'SE': (15.68667, 60.35568),
-'SG': (103.84187, 1.304),
-'SH': (-12.28155, -37.11546),
-'SI': (14.04738, 46.39085),
-'SJ': (15.27552, 79.23365),
-'SK': (20.41603, 48.86970),
-'SL': (-11.47773, 8.78156),
-'SM': (12.46062, 43.94279),
-'SN': (-15.37111, 14.99477),
-'SO': (46.93383, 9.34094),
-'SR': (-55.42864, 4.56985),
-'SS': (28.13573, 8.50933),
-'ST': (6.61025, 0.2215),
-'SV': (-89.36665, 13.43072),
-'SX': (-63.15393, 17.9345),
-'SY': (38.15513, 35.34221),
-'SZ': (31.78263, -26.14244),
-'TC': (-71.32554, 21.35),
-'TD': (17.42092, 13.46223),
-'TF': (137.5, -67.5),
-'TG': (1.06983, 7.87677),
-'TH': (102.00877, 16.42310),
-'TJ': (71.91349, 39.01527),
-'TK': (-171.82603, -9.20990),
-'TL': (126.22520, -8.72636),
-'TM': (57.71603, 39.92534),
-'TN': (9.04958, 34.84199),
-'TO': (-176.99320, -23.11104),
-'TR': (32.82002, 39.86350),
-'TT': (-60.70793, 11.1385),
-'TV': (178.77499, -9.41685),
-'TW': (120.30074, 23.17002),
-'TZ': (33.53892, -5.01840),
-'UA': (33.44335, 49.30619),
-'UG': (32.96523, 2.08584),
-'UM': (-169.50993, 16.74605),
-'US': (-116.39535, 40.71379),
-'UY': (-56.46505, -33.62658),
-'UZ': (61.35529, 42.96107),
-'VA': (12.33197, 42.04931),
-'VC': (-61.09905, 13.316),
-'VE': (-64.88323, 7.69849),
-'VG': (-64.62479, 18.419),
-'VI': (-64.88950, 18.32263),
-'VN': (104.20179, 10.27644),
-'VU': (167.31919, -15.88687),
-'WF': (-176.20781, -13.28535),
-'WS': (-172.10966, -13.85093),
-'YE': (45.94562, 16.16338),
-'YT': (44.93774, -12.60882),
-'ZA': (23.19488, -30.43276),
-'ZM': (26.38618, -14.39966),
-'ZW': (30.12419, -19.86907)
-}
diff --git a/test/bdd/steps/geometry_factory.py b/test/bdd/steps/geometry_factory.py
deleted file mode 100644
index 19c0406c..00000000
--- a/test/bdd/steps/geometry_factory.py
+++ /dev/null
@@ -1,94 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2022 by the Nominatim developer community.
-# For a full list of authors see the git log.
-from pathlib import Path
-import os
-
-from steps.geometry_alias import ALIASES
-
-class GeometryFactory:
-    """ Provides functions to create geometries from coordinates and data grids.
-    """
-
-    def __init__(self):
-        self.grid = {}
-
-    def parse_geometry(self, geom):
-        """ Create a WKT SQL term for the given geometry.
-            The function understands the following formats:
-
-              country:<country code>
-                 Point geometry guaranteed to be in the given country
-              <P>
-                 Point geometry
-              <P>,...,<P>
-                 Line geometry
-              (<P>,...,<P>)
-                 Polygon geometry
-
-           <P> may either be a coordinate of the form '<x> <y>' or a single
-           number. In the latter case it must refer to a point in
-           a previously defined grid.
-        """
-        if geom.startswith('country:'):
-            ccode = geom[8:].upper()
-            assert ccode in ALIASES, "Geometry error: unknown country " + ccode
-            return "ST_SetSRID('POINT({} {})'::geometry, 4326)".format(*ALIASES[ccode])
-
-        if geom.find(',') < 0:
-            out = "POINT({})".format(self.mk_wkt_point(geom))
-        elif geom.find('(') < 0:
-            out = "LINESTRING({})".format(self.mk_wkt_points(geom))
-        else:
-            out = "POLYGON(({}))".format(self.mk_wkt_points(geom.strip('() ')))
-
-        return "ST_SetSRID('{}'::geometry, 4326)".format(out)
-
-
-    def mk_wkt_point(self, point):
-        """ Parse a point description.
-            The point may either consist of 'x y' coordinates or a number
-            that refers to a grid setup.
-        """
-        geom = point.strip()
-        if geom.find(' ') >= 0:
-            return geom
-
-        try:
-            pt = self.grid_node(int(geom))
-        except ValueError:
-            assert False, "Scenario error: Point '{}' is not a number".format(geom)
-
-        assert pt is not None, "Scenario error: Point '{}' not found in grid".format(geom)
-        return "{} {}".format(*pt)
-
-
-    def mk_wkt_points(self, geom):
-        """ Parse a list of points.
-            The list must be a comma-separated list of points. Points
-            in coordinate and grid format may be mixed.
-        """
-        return ','.join([self.mk_wkt_point(x) for x in geom.split(',')])
-
-
-    def set_grid(self, lines, grid_step, origin=(0.0, 0.0)):
-        """ Replace the grid with one from the given lines.
-        """
-        self.grid = {}
-        y = origin[1]
-        for line in lines:
-            x = origin[0]
-            for pt_id in line:
-                if pt_id.isdigit():
-                    self.grid[int(pt_id)] = (x, y)
-                x += grid_step
-            y += grid_step
-
-
-    def grid_node(self, nodeid):
-        """ Get the coordinates for the given grid node.
-        """
-        return self.grid.get(nodeid)
diff --git a/test/bdd/steps/http_responses.py b/test/bdd/steps/http_responses.py
deleted file mode 100644
index 2e24ed50..00000000
--- a/test/bdd/steps/http_responses.py
+++ /dev/null
@@ -1,259 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2023 by the Nominatim developer community.
-# For a full list of authors see the git log.
-"""
-Classes wrapping HTTP responses from the Nominatim API.
-"""
-import re
-import json
-import xml.etree.ElementTree as ET
-
-from check_functions import Almost, OsmType, Field, check_for_attributes
-
-
-class GenericResponse:
-    """ Common base class for all API responses.
-    """
-    def __init__(self, page, fmt, errorcode=200):
-        fmt = fmt.strip()
-        if fmt == 'jsonv2':
-            fmt = 'json'
-
-        self.page = page
-        self.format = fmt
-        self.errorcode = errorcode
-        self.result = []
-        self.header = dict()
-
-        if errorcode == 200 and fmt != 'debug':
-            getattr(self, '_parse_' + fmt)()
-
-    def _parse_json(self):
-        m = re.fullmatch(r'([\w$][^(]*)\((.*)\)', self.page)
-        if m is None:
-            code = self.page
-        else:
-            code = m.group(2)
-            self.header['json_func'] = m.group(1)
-        self.result = json.JSONDecoder().decode(code)
-        if isinstance(self.result, dict):
-            if 'error' in self.result:
-                self.result = []
-            else:
-                self.result = [self.result]
-
-
-    def _parse_geojson(self):
-        self._parse_json()
-        if self.result:
-            geojson = self.result[0]
-            # check for valid geojson
-            check_for_attributes(geojson, 'type,features')
-            assert geojson['type'] == 'FeatureCollection'
-            assert isinstance(geojson['features'], list)
-
-            self.result = []
-            for result in geojson['features']:
-                check_for_attributes(result, 'type,properties,geometry')
-                assert result['type'] == 'Feature'
-                new = result['properties']
-                check_for_attributes(new, 'geojson', 'absent')
-                new['geojson'] = result['geometry']
-                if 'bbox' in result:
-                    check_for_attributes(new, 'boundingbox', 'absent')
-                    # bbox is  minlon, minlat, maxlon, maxlat
-                    # boundingbox is minlat, maxlat, minlon, maxlon
-                    new['boundingbox'] = [result['bbox'][1],
-                                          result['bbox'][3],
-                                          result['bbox'][0],
-                                          result['bbox'][2]]
-                for k, v in geojson.items():
-                    if k not in ('type', 'features'):
-                        check_for_attributes(new, '__' + k, 'absent')
-                        new['__' + k] = v
-                self.result.append(new)
-
-
-    def _parse_geocodejson(self):
-        self._parse_geojson()
-        if self.result:
-            for r in self.result:
-                assert set(r.keys()) == {'geocoding', 'geojson', '__geocoding'}, \
-                       f"Unexpected keys in result: {r.keys()}"
-                check_for_attributes(r['geocoding'], 'geojson', 'absent')
-                inner = r.pop('geocoding')
-                r.update(inner)
-
-
-    def assert_address_field(self, idx, field, value):
-        """ Check that result rows`idx` has a field `field` with value `value`
-            in its address. If idx is None, then all results are checked.
-        """
-        if idx is None:
-            todo = range(len(self.result))
-        else:
-            todo = [int(idx)]
-
-        for idx in todo:
-            self.check_row(idx, 'address' in self.result[idx], "No field 'address'")
-
-            address = self.result[idx]['address']
-            self.check_row_field(idx, field, value, base=address)
-
-
-    def match_row(self, row, context=None, field=None):
-        """ Match the result fields against the given behave table row.
-        """
-        if 'ID' in row.headings:
-            todo = [int(row['ID'])]
-        else:
-            todo = range(len(self.result))
-
-        for i in todo:
-            subdict = self.result[i]
-            if field is not None:
-                for key in field.split('.'):
-                    self.check_row(i, key in subdict, f"Missing subfield {key}")
-                    subdict = subdict[key]
-                    self.check_row(i, isinstance(subdict, dict),
-                                   f"Subfield {key} not a dict")
-
-            for name, value in zip(row.headings, row.cells):
-                if name == 'ID':
-                    pass
-                elif name == 'osm':
-                    self.check_row_field(i, 'osm_type', OsmType(value[0]), base=subdict)
-                    self.check_row_field(i, 'osm_id', Field(value[1:]), base=subdict)
-                elif name == 'centroid':
-                    if ' ' in value:
-                        lon, lat = value.split(' ')
-                    elif context is not None:
-                        lon, lat = context.osm.grid_node(int(value))
-                    else:
-                        raise RuntimeError("Context needed when using grid coordinates")
-                    self.check_row_field(i, 'lat', Field(float(lat), abs_tol=1e-07), base=subdict)
-                    self.check_row_field(i, 'lon', Field(float(lon), abs_tol=1e-07), base=subdict)
-                else:
-                    self.check_row_field(i, name, Field(value), base=subdict)
-
-
-    def check_row(self, idx, check, msg):
-        """ Assert for the condition 'check' and print 'msg' on fail together
-            with the contents of the failing result.
-        """
-        class _RowError:
-            def __init__(self, row):
-                self.row = row
-
-            def __str__(self):
-                return f"{msg}. Full row {idx}:\n" \
-                       + json.dumps(self.row, indent=4, ensure_ascii=False)
-
-        assert check, _RowError(self.result[idx])
-
-
-    def check_row_field(self, idx, field, expected, base=None):
-        """ Check field 'field' of result 'idx' for the expected value
-            and print a meaningful error if the condition fails.
-            When 'base' is set to a dictionary, then the field is checked
-            in that base. The error message will still report the contents
-            of the full result.
-        """
-        if base is None:
-            base = self.result[idx]
-
-        self.check_row(idx, field in base, f"No field '{field}'")
-        value = base[field]
-
-        self.check_row(idx, expected == value,
-                       f"\nBad value for field '{field}'. Expected: {expected}, got: {value}")
-
-
-
-class SearchResponse(GenericResponse):
-    """ Specialised class for search and lookup responses.
-        Transforms the xml response in a format similar to json.
-    """
-
-    def _parse_xml(self):
-        xml_tree = ET.fromstring(self.page)
-
-        self.header = dict(xml_tree.attrib)
-
-        for child in xml_tree:
-            assert child.tag == "place"
-            self.result.append(dict(child.attrib))
-
-            address = {}
-            for sub in child:
-                if sub.tag == 'extratags':
-                    self.result[-1]['extratags'] = {}
-                    for tag in sub:
-                        self.result[-1]['extratags'][tag.attrib['key']] = tag.attrib['value']
-                elif sub.tag == 'namedetails':
-                    self.result[-1]['namedetails'] = {}
-                    for tag in sub:
-                        self.result[-1]['namedetails'][tag.attrib['desc']] = tag.text
-                elif sub.tag == 'geokml':
-                    self.result[-1][sub.tag] = True
-                else:
-                    address[sub.tag] = sub.text
-
-            if address:
-                self.result[-1]['address'] = address
-
-
-class ReverseResponse(GenericResponse):
-    """ Specialised class for reverse responses.
-        Transforms the xml response in a format similar to json.
-    """
-
-    def _parse_xml(self):
-        xml_tree = ET.fromstring(self.page)
-
-        self.header = dict(xml_tree.attrib)
-        self.result = []
-
-        for child in xml_tree:
-            if child.tag == 'result':
-                assert not self.result, "More than one result in reverse result"
-                self.result.append(dict(child.attrib))
-                check_for_attributes(self.result[0], 'display_name', 'absent')
-                self.result[0]['display_name'] = child.text
-            elif child.tag == 'addressparts':
-                assert 'address' not in self.result[0], "More than one address in result"
-                address = {}
-                for sub in child:
-                    assert len(sub) == 0, f"Address element '{sub.tag}' has subelements"
-                    address[sub.tag] = sub.text
-                self.result[0]['address'] = address
-            elif child.tag == 'extratags':
-                assert 'extratags' not in self.result[0], "More than one extratags in result"
-                self.result[0]['extratags'] = {}
-                for tag in child:
-                    assert len(tag) == 0, f"Extratags element '{tag.attrib['key']}' has subelements"
-                    self.result[0]['extratags'][tag.attrib['key']] = tag.attrib['value']
-            elif child.tag == 'namedetails':
-                assert 'namedetails' not in self.result[0], "More than one namedetails in result"
-                self.result[0]['namedetails'] = {}
-                for tag in child:
-                    assert len(tag) == 0, f"Namedetails element '{tag.attrib['desc']}' has subelements"
-                    self.result[0]['namedetails'][tag.attrib['desc']] = tag.text
-            elif child.tag == 'geokml':
-                assert 'geokml' not in self.result[0], "More than one geokml in result"
-                self.result[0]['geokml'] = ET.tostring(child, encoding='unicode')
-            else:
-                assert child.tag == 'error', \
-                       f"Unknown XML tag {child.tag} on page: {self.page}"
-
-
-class StatusResponse(GenericResponse):
-    """ Specialised class for status responses.
-        Can also parse text responses.
-    """
-
-    def _parse_text(self):
-        pass
diff --git a/test/bdd/steps/nominatim_environment.py b/test/bdd/steps/nominatim_environment.py
deleted file mode 100644
index ba19bb48..00000000
--- a/test/bdd/steps/nominatim_environment.py
+++ /dev/null
@@ -1,331 +0,0 @@
-# SPDX-License-Identifier: GPL-3.0-or-later
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2024 by the Nominatim developer community.
-# For a full list of authors see the git log.
-from pathlib import Path
-import importlib
-import tempfile
-
-import psycopg
-from psycopg import sql as pysql
-
-from nominatim_db import cli
-from nominatim_db.config import Configuration
-from nominatim_db.db.connection import Connection, register_hstore, execute_scalar
-from nominatim_db.tools import refresh
-from nominatim_db.tokenizer import factory as tokenizer_factory
-from steps.utils import run_script
-
-class NominatimEnvironment:
-    """ Collects all functions for the execution of Nominatim functions.
-    """
-
-    def __init__(self, config):
-        self.src_dir = (Path(__file__) / '..' / '..' / '..' / '..').resolve()
-        self.db_host = config['DB_HOST']
-        self.db_port = config['DB_PORT']
-        self.db_user = config['DB_USER']
-        self.db_pass = config['DB_PASS']
-        self.template_db = config['TEMPLATE_DB']
-        self.test_db = config['TEST_DB']
-        self.api_test_db = config['API_TEST_DB']
-        self.api_test_file = config['API_TEST_FILE']
-        self.tokenizer = config['TOKENIZER']
-        self.import_style = config['STYLE']
-        self.reuse_template = not config['REMOVE_TEMPLATE']
-        self.keep_scenario_db = config['KEEP_TEST_DB']
-
-        self.default_config = Configuration(None).get_os_env()
-        self.test_env = None
-        self.template_db_done = False
-        self.api_db_done = False
-        self.website_dir = None
-
-        if not hasattr(self, f"create_api_request_func_{config['API_ENGINE']}"):
-            raise RuntimeError(f"Unknown API engine '{config['API_ENGINE']}'")
-        self.api_engine = getattr(self, f"create_api_request_func_{config['API_ENGINE']}")()
-
-    def connect_database(self, dbname):
-        """ Return a connection to the database with the given name.
-            Uses configured host, user and port.
-        """
-        dbargs = {'dbname': dbname, 'row_factory': psycopg.rows.dict_row}
-        if self.db_host:
-            dbargs['host'] = self.db_host
-        if self.db_port:
-            dbargs['port'] = self.db_port
-        if self.db_user:
-            dbargs['user'] = self.db_user
-        if self.db_pass:
-            dbargs['password'] = self.db_pass
-        return psycopg.connect(**dbargs)
-
-
-    def write_nominatim_config(self, dbname):
-        """ Set up a custom test configuration that connects to the given
-            database. This sets up the environment variables so that they can
-            be picked up by dotenv and creates a project directory with the
-            appropriate website scripts.
-        """
-        if dbname.startswith('sqlite:'):
-            dsn = 'sqlite:dbname={}'.format(dbname[7:])
-        else:
-            dsn = 'pgsql:dbname={}'.format(dbname)
-        if self.db_host:
-            dsn += ';host=' + self.db_host
-        if self.db_port:
-            dsn += ';port=' + self.db_port
-        if self.db_user:
-            dsn += ';user=' + self.db_user
-        if self.db_pass:
-            dsn += ';password=' + self.db_pass
-
-        self.test_env = dict(self.default_config)
-        self.test_env['NOMINATIM_DATABASE_DSN'] = dsn
-        self.test_env['NOMINATIM_LANGUAGES'] = 'en,de,fr,ja'
-        self.test_env['NOMINATIM_FLATNODE_FILE'] = ''
-        self.test_env['NOMINATIM_IMPORT_STYLE'] = 'full'
-        self.test_env['NOMINATIM_USE_US_TIGER_DATA'] = 'yes'
-        self.test_env['NOMINATIM_DATADIR'] = str((self.src_dir / 'data').resolve())
-        self.test_env['NOMINATIM_SQLDIR'] = str((self.src_dir / 'lib-sql').resolve())
-        self.test_env['NOMINATIM_CONFIGDIR'] = str((self.src_dir / 'settings').resolve())
-        if self.tokenizer is not None:
-            self.test_env['NOMINATIM_TOKENIZER'] = self.tokenizer
-        if self.import_style is not None:
-            self.test_env['NOMINATIM_IMPORT_STYLE'] = self.import_style
-
-        if self.website_dir is not None:
-            self.website_dir.cleanup()
-
-        self.website_dir = tempfile.TemporaryDirectory()
-
-
-    def get_test_config(self):
-        cfg = Configuration(Path(self.website_dir.name), environ=self.test_env)
-        return cfg
-
-    def get_libpq_dsn(self):
-        dsn = self.test_env['NOMINATIM_DATABASE_DSN']
-
-        def quote_param(param):
-            key, val = param.split('=')
-            val = val.replace('\\', '\\\\').replace("'", "\\'")
-            if ' ' in val:
-                val = "'" + val + "'"
-            return key + '=' + val
-
-        if dsn.startswith('pgsql:'):
-            # Old PHP DSN format. Convert before returning.
-            return ' '.join([quote_param(p) for p in dsn[6:].split(';')])
-
-        return dsn
-
-
-    def db_drop_database(self, name):
-        """ Drop the database with the given name.
-        """
-        with self.connect_database('postgres') as conn:
-            conn.autocommit = True
-            conn.execute(pysql.SQL('DROP DATABASE IF EXISTS')
-                         +  pysql.Identifier(name))
-
-    def setup_template_db(self):
-        """ Setup a template database that already contains common test data.
-            Having a template database speeds up tests considerably but at
-            the price that the tests sometimes run with stale data.
-        """
-        if self.template_db_done:
-            return
-
-        self.template_db_done = True
-
-        self.write_nominatim_config(self.template_db)
-
-        if not self._reuse_or_drop_db(self.template_db):
-            try:
-                # execute nominatim import on an empty file to get the right tables
-                with tempfile.NamedTemporaryFile(dir='/tmp', suffix='.xml') as fd:
-                    fd.write(b'<osm version="0.6"></osm>')
-                    fd.flush()
-                    self.run_nominatim('import', '--osm-file', fd.name,
-                                                 '--osm2pgsql-cache', '1',
-                                                 '--ignore-errors',
-                                                 '--offline', '--index-noanalyse')
-            except:
-                self.db_drop_database(self.template_db)
-                raise
-
-        self.run_nominatim('refresh', '--functions')
-
-
-    def setup_api_db(self):
-        """ Setup a test against the API test database.
-        """
-        self.write_nominatim_config(self.api_test_db)
-
-        if self.api_test_db.startswith('sqlite:'):
-            return
-
-        if not self.api_db_done:
-            self.api_db_done = True
-
-            if not self._reuse_or_drop_db(self.api_test_db):
-                testdata = (Path(__file__) / '..' / '..' / '..' / 'testdb').resolve()
-                self.test_env['NOMINATIM_WIKIPEDIA_DATA_PATH'] = str(testdata)
-                simp_file = Path(self.website_dir.name) / 'secondary_importance.sql.gz'
-                simp_file.symlink_to(testdata / 'secondary_importance.sql.gz')
-
-                try:
-                    self.run_nominatim('import', '--osm-file', str(self.api_test_file))
-                    self.run_nominatim('add-data', '--tiger-data', str(testdata / 'tiger'))
-                    self.run_nominatim('freeze')
-
-                    csv_path = str(testdata / 'full_en_phrases_test.csv')
-                    self.run_nominatim('special-phrases', '--import-from-csv', csv_path)
-                except:
-                    self.db_drop_database(self.api_test_db)
-                    raise
-
-        tokenizer_factory.get_tokenizer_for_db(self.get_test_config())
-
-
-    def setup_unknown_db(self):
-        """ Setup a test against a non-existing database.
-        """
-        # The tokenizer needs an existing database to function.
-        # So start with the usual database
-        class _Context:
-            db = None
-
-        context = _Context()
-        self.setup_db(context)
-        tokenizer_factory.create_tokenizer(self.get_test_config(), init_db=False)
-
-        # Then drop the DB again
-        self.teardown_db(context, force_drop=True)
-
-    def setup_db(self, context):
-        """ Setup a test against a fresh, empty test database.
-        """
-        self.setup_template_db()
-        with self.connect_database(self.template_db) as conn:
-            conn.autocommit = True
-            conn.execute(pysql.SQL('DROP DATABASE IF EXISTS')
-                                   + pysql.Identifier(self.test_db))
-            conn.execute(pysql.SQL('CREATE DATABASE {} TEMPLATE = {}').format(
-                           pysql.Identifier(self.test_db),
-                           pysql.Identifier(self.template_db)))
-
-        self.write_nominatim_config(self.test_db)
-        context.db = self.connect_database(self.test_db)
-        context.db.autocommit = True
-        register_hstore(context.db)
-
-    def teardown_db(self, context, force_drop=False):
-        """ Remove the test database, if it exists.
-        """
-        if hasattr(context, 'db'):
-            context.db.close()
-
-        if force_drop or not self.keep_scenario_db:
-            self.db_drop_database(self.test_db)
-
-    def _reuse_or_drop_db(self, name):
-        """ Check for the existence of the given DB. If reuse is enabled,
-            then the function checks for existnce and returns True if the
-            database is already there. Otherwise an existing database is
-            dropped and always false returned.
-        """
-        if self.reuse_template:
-            with self.connect_database('postgres') as conn:
-                num = execute_scalar(conn,
-                                     'select count(*) from pg_database where datname = %s',
-                                     (name,))
-                if num == 1:
-                    return True
-        else:
-            self.db_drop_database(name)
-
-        return False
-
-
-    def reindex_placex(self, db):
-        """ Run the indexing step until all data in the placex has
-            been processed. Indexing during updates can produce more data
-            to index under some circumstances. That is why indexing may have
-            to be run multiple times.
-        """
-        self.run_nominatim('index')
-
-
-    def run_nominatim(self, *cmdline):
-        """ Run the nominatim command-line tool via the library.
-        """
-        if self.website_dir is not None:
-            cmdline = list(cmdline) + ['--project-dir', self.website_dir.name]
-
-        cli.nominatim(osm2pgsql_path=None,
-                      cli_args=cmdline,
-                      environ=self.test_env)
-
-
-    def copy_from_place(self, db):
-        """ Copy data from place to the placex and location_property_osmline
-            tables invoking the appropriate triggers.
-        """
-        self.run_nominatim('refresh', '--functions', '--no-diff-updates')
-
-        with db.cursor() as cur:
-            cur.execute("""INSERT INTO placex (osm_type, osm_id, class, type,
-                                               name, admin_level, address,
-                                               extratags, geometry)
-                             SELECT osm_type, osm_id, class, type,
-                                    name, admin_level, address,
-                                    extratags, geometry
-                               FROM place
-                               WHERE not (class='place' and type='houses' and osm_type='W')""")
-            cur.execute("""INSERT INTO location_property_osmline (osm_id, address, linegeo)
-                             SELECT osm_id, address, geometry
-                               FROM place
-                              WHERE class='place' and type='houses'
-                                    and osm_type='W'
-                                    and ST_GeometryType(geometry) = 'ST_LineString'""")
-
-
-    def create_api_request_func_starlette(self):
-        import nominatim_api.server.starlette.server
-        from asgi_lifespan import LifespanManager
-        import httpx
-
-        async def _request(endpoint, params, project_dir, environ, http_headers):
-            app = nominatim_api.server.starlette.server.get_application(project_dir, environ)
-
-            async with LifespanManager(app):
-                async with httpx.AsyncClient(app=app, base_url="http://nominatim.test") as client:
-                    response = await client.get(f"/{endpoint}", params=params,
-                                                headers=http_headers)
-
-            return response.text, response.status_code
-
-        return _request
-
-
-    def create_api_request_func_falcon(self):
-        import nominatim_api.server.falcon.server
-        import falcon.testing
-
-        async def _request(endpoint, params, project_dir, environ, http_headers):
-            app = nominatim_api.server.falcon.server.get_application(project_dir, environ)
-
-            async with falcon.testing.ASGIConductor(app) as conductor:
-                response = await conductor.get(f"/{endpoint}", params=params,
-                                               headers=http_headers)
-
-            return response.text, response.status_code
-
-        return _request
-
-
-
diff --git a/test/bdd/steps/steps_api_queries.py b/test/bdd/steps/steps_api_queries.py
deleted file mode 100644
index 4d15381d..00000000
--- a/test/bdd/steps/steps_api_queries.py
+++ /dev/null
@@ -1,301 +0,0 @@
-# SPDX-License-Identifier: GPL-3.0-or-later
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2024 by the Nominatim developer community.
-# For a full list of authors see the git log.
-""" Steps that run queries against the API.
-"""
-from pathlib import Path
-import json
-import os
-import re
-import logging
-import asyncio
-import xml.etree.ElementTree as ET
-from urllib.parse import urlencode
-
-from utils import run_script
-from http_responses import GenericResponse, SearchResponse, ReverseResponse, StatusResponse
-from check_functions import Bbox, check_for_attributes
-from table_compare import NominatimID
-
-LOG = logging.getLogger(__name__)
-
-
-def make_todo_list(context, result_id):
-    if result_id is None:
-        context.execute_steps("then at least 1 result is returned")
-        return range(len(context.response.result))
-
-    context.execute_steps(f"then more than {result_id}results are returned")
-    return (int(result_id.strip()), )
-
-
-def compare(operator, op1, op2):
-    if operator == 'less than':
-        return op1 < op2
-    elif operator == 'more than':
-        return op1 > op2
-    elif operator == 'exactly':
-        return op1 == op2
-    elif operator == 'at least':
-        return op1 >= op2
-    elif operator == 'at most':
-        return op1 <= op2
-    else:
-        raise ValueError(f"Unknown operator '{operator}'")
-
-
-def send_api_query(endpoint, params, fmt, context):
-    if fmt is not None:
-        if fmt.strip() == 'debug':
-            params['debug'] = '1'
-        else:
-            params['format'] = fmt.strip()
-
-    if context.table:
-        if context.table.headings[0] == 'param':
-            for line in context.table:
-                params[line['param']] = line['value']
-        else:
-            for h in context.table.headings:
-                params[h] = context.table[0][h]
-
-    return asyncio.run(context.nominatim.api_engine(endpoint, params,
-                                                    Path(context.nominatim.website_dir.name),
-                                                    context.nominatim.test_env,
-                                                    getattr(context, 'http_headers', {})))
-
-
-@given(u'the HTTP header')
-def add_http_header(context):
-    if not hasattr(context, 'http_headers'):
-        context.http_headers = {}
-
-    for h in context.table.headings:
-        context.http_headers[h] = context.table[0][h]
-
-
-@when(u'sending (?P<fmt>\S+ )?search query "(?P<query>.*)"(?P<addr> with address)?')
-def website_search_request(context, fmt, query, addr):
-    params = {}
-    if query:
-        params['q'] = query
-    if addr is not None:
-        params['addressdetails'] = '1'
-
-    outp, status = send_api_query('search', params, fmt, context)
-
-    context.response = SearchResponse(outp, fmt or 'json', status)
-
-
-@when('sending v1/reverse at (?P<lat>[\d.-]*),(?P<lon>[\d.-]*)(?: with format (?P<fmt>.+))?')
-def api_endpoint_v1_reverse(context, lat, lon, fmt):
-    params = {}
-    if lat is not None:
-        params['lat'] = lat
-    if lon is not None:
-        params['lon'] = lon
-    if fmt is None:
-        fmt = 'jsonv2'
-    elif fmt == "''":
-        fmt = None
-
-    outp, status = send_api_query('reverse', params, fmt, context)
-    context.response = ReverseResponse(outp, fmt or 'xml', status)
-
-
-@when('sending v1/reverse N(?P<nodeid>\d+)(?: with format (?P<fmt>.+))?')
-def api_endpoint_v1_reverse_from_node(context, nodeid, fmt):
-    params = {}
-    params['lon'], params['lat'] = (f'{c:f}' for c in context.osm.grid_node(int(nodeid)))
-
-    outp, status = send_api_query('reverse', params, fmt, context)
-    context.response = ReverseResponse(outp, fmt or 'xml', status)
-
-
-@when(u'sending (?P<fmt>\S+ )?details query for (?P<query>.*)')
-def website_details_request(context, fmt, query):
-    params = {}
-    if query[0] in 'NWR':
-        nid = NominatimID(query)
-        params['osmtype'] = nid.typ
-        params['osmid'] = nid.oid
-        if nid.cls:
-            params['class'] = nid.cls
-    else:
-        params['place_id'] = query
-    outp, status = send_api_query('details', params, fmt, context)
-
-    context.response = GenericResponse(outp, fmt or 'json', status)
-
-@when(u'sending (?P<fmt>\S+ )?lookup query for (?P<query>.*)')
-def website_lookup_request(context, fmt, query):
-    params = { 'osm_ids' : query }
-    outp, status = send_api_query('lookup', params, fmt, context)
-
-    context.response = SearchResponse(outp, fmt or 'xml', status)
-
-@when(u'sending (?P<fmt>\S+ )?status query')
-def website_status_request(context, fmt):
-    params = {}
-    outp, status = send_api_query('status', params, fmt, context)
-
-    context.response = StatusResponse(outp, fmt or 'text', status)
-
-@step(u'(?P<operator>less than|more than|exactly|at least|at most) (?P<number>\d+) results? (?:is|are) returned')
-def validate_result_number(context, operator, number):
-    context.execute_steps("Then a HTTP 200 is returned")
-    numres = len(context.response.result)
-    assert compare(operator, numres, int(number)), \
-           f"Bad number of results: expected {operator} {number}, got {numres}."
-
-@then(u'a HTTP (?P<status>\d+) is returned')
-def check_http_return_status(context, status):
-    assert context.response.errorcode == int(status), \
-           f"Return HTTP status is {context.response.errorcode}."\
-           f" Full response:\n{context.response.page}"
-
-@then(u'the page contents equals "(?P<text>.+)"')
-def check_page_content_equals(context, text):
-    assert context.response.page == text
-
-@then(u'the result is valid (?P<fmt>\w+)')
-def step_impl(context, fmt):
-    context.execute_steps("Then a HTTP 200 is returned")
-    if fmt.strip() == 'html':
-        try:
-            tree = ET.fromstring(context.response.page)
-        except Exception as ex:
-            assert False, f"Could not parse page: {ex}\n{context.response.page}"
-
-        assert tree.tag == 'html'
-        body = tree.find('./body')
-        assert body is not None
-        assert body.find('.//script') is None
-    else:
-        assert context.response.format == fmt
-
-
-@then(u'a (?P<fmt>\w+) user error is returned')
-def check_page_error(context, fmt):
-    context.execute_steps("Then a HTTP 400 is returned")
-    assert context.response.format == fmt
-
-    if fmt == 'xml':
-        assert re.search(r'<error>.+</error>', context.response.page, re.DOTALL) is not None
-    else:
-        assert re.search(r'({"error":)', context.response.page, re.DOTALL) is not None
-
-@then(u'result header contains')
-def check_header_attr(context):
-    context.execute_steps("Then a HTTP 200 is returned")
-    for line in context.table:
-        assert line['attr'] in context.response.header, \
-               f"Field '{line['attr']}' missing in header. Full header:\n{context.response.header}"
-        value = context.response.header[line['attr']]
-        assert re.fullmatch(line['value'], value) is not None, \
-               f"Attribute '{line['attr']}': expected: '{line['value']}', got '{value}'"
-
-
-@then(u'result header has (?P<neg>not )?attributes (?P<attrs>.*)')
-def check_header_no_attr(context, neg, attrs):
-    check_for_attributes(context.response.header, attrs,
-                         'absent' if neg else 'present')
-
-
-@then(u'results contain(?: in field (?P<field>.*))?')
-def step_impl(context, field):
-    context.execute_steps("then at least 1 result is returned")
-
-    for line in context.table:
-        context.response.match_row(line, context=context, field=field)
-
-
-@then(u'result (?P<lid>\d+ )?has (?P<neg>not )?attributes (?P<attrs>.*)')
-def validate_attributes(context, lid, neg, attrs):
-    for i in make_todo_list(context, lid):
-        check_for_attributes(context.response.result[i], attrs,
-                             'absent' if neg else 'present')
-
-
-@then(u'result addresses contain')
-def step_impl(context):
-    context.execute_steps("then at least 1 result is returned")
-
-    for line in context.table:
-        idx = int(line['ID']) if 'ID' in line.headings else None
-
-        for name, value in zip(line.headings, line.cells):
-            if name != 'ID':
-                context.response.assert_address_field(idx, name, value)
-
-@then(u'address of result (?P<lid>\d+) has(?P<neg> no)? types (?P<attrs>.*)')
-def check_address(context, lid, neg, attrs):
-    context.execute_steps(f"then more than {lid} results are returned")
-
-    addr_parts = context.response.result[int(lid)]['address']
-
-    for attr in attrs.split(','):
-        if neg:
-            assert attr not in addr_parts
-        else:
-            assert attr in addr_parts
-
-@then(u'address of result (?P<lid>\d+) (?P<complete>is|contains)')
-def check_address(context, lid, complete):
-    context.execute_steps(f"then more than {lid} results are returned")
-
-    lid = int(lid)
-    addr_parts = dict(context.response.result[lid]['address'])
-
-    for line in context.table:
-        context.response.assert_address_field(lid, line['type'], line['value'])
-        del addr_parts[line['type']]
-
-    if complete == 'is':
-        assert len(addr_parts) == 0, f"Additional address parts found: {addr_parts!s}"
-
-
-@then(u'result (?P<lid>\d+ )?has bounding box in (?P<coords>[\d,.-]+)')
-def check_bounding_box_in_area(context, lid, coords):
-    expected = Bbox(coords)
-
-    for idx in make_todo_list(context, lid):
-        res = context.response.result[idx]
-        check_for_attributes(res, 'boundingbox')
-        context.response.check_row(idx, res['boundingbox'] in expected,
-                                   f"Bbox is not contained in {expected}")
-
-
-@then(u'result (?P<lid>\d+ )?has centroid in (?P<coords>[\d,.-]+)')
-def check_centroid_in_area(context, lid, coords):
-    expected = Bbox(coords)
-
-    for idx in make_todo_list(context, lid):
-        res = context.response.result[idx]
-        check_for_attributes(res, 'lat,lon')
-        context.response.check_row(idx, (res['lon'], res['lat']) in expected,
-                                   f"Centroid is not inside {expected}")
-
-
-@then(u'there are(?P<neg> no)? duplicates')
-def check_for_duplicates(context, neg):
-    context.execute_steps("then at least 1 result is returned")
-
-    resarr = set()
-    has_dupe = False
-
-    for res in context.response.result:
-        dup = (res['osm_type'], res['class'], res['type'], res['display_name'])
-        if dup in resarr:
-            has_dupe = True
-            break
-        resarr.add(dup)
-
-    if neg:
-        assert not has_dupe, f"Found duplicate for {dup}"
-    else:
-        assert has_dupe, "No duplicates found"
-
diff --git a/test/bdd/steps/steps_db_ops.py b/test/bdd/steps/steps_db_ops.py
deleted file mode 100644
index fb8431d5..00000000
--- a/test/bdd/steps/steps_db_ops.py
+++ /dev/null
@@ -1,450 +0,0 @@
-# SPDX-License-Identifier: GPL-3.0-or-later
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2024 by the Nominatim developer community.
-# For a full list of authors see the git log.
-import logging
-from itertools import chain
-
-import psycopg
-from psycopg import sql as pysql
-
-from place_inserter import PlaceColumn
-from table_compare import NominatimID, DBRow
-
-from nominatim_db.indexer import indexer
-from nominatim_db.tokenizer import factory as tokenizer_factory
-
-def check_database_integrity(context):
-    """ Check some generic constraints on the tables.
-    """
-    with context.db.cursor(row_factory=psycopg.rows.tuple_row) as cur:
-        # place_addressline should not have duplicate (place_id, address_place_id)
-        cur.execute("""SELECT count(*) FROM
-                        (SELECT place_id, address_place_id, count(*) as c
-                         FROM place_addressline GROUP BY place_id, address_place_id) x
-                       WHERE c > 1""")
-        assert cur.fetchone()[0] == 0, "Duplicates found in place_addressline"
-
-        # word table must not have empty word_tokens
-        cur.execute("SELECT count(*) FROM word WHERE word_token = ''")
-        assert cur.fetchone()[0] == 0, "Empty word tokens found in word table"
-
-
-
-################################ GIVEN ##################################
-
-@given("the (?P<named>named )?places")
-def add_data_to_place_table(context, named):
-    """ Add entries into the place table. 'named places' makes sure that
-        the entries get a random name when none is explicitly given.
-    """
-    with context.db.cursor() as cur:
-        cur.execute('ALTER TABLE place DISABLE TRIGGER place_before_insert')
-        for row in context.table:
-            PlaceColumn(context).add_row(row, named is not None).db_insert(cur)
-        cur.execute('ALTER TABLE place ENABLE TRIGGER place_before_insert')
-
-@given("the relations")
-def add_data_to_planet_relations(context):
-    """ Add entries into the osm2pgsql relation middle table. This is needed
-        for tests on data that looks up members.
-    """
-    with context.db.cursor() as cur:
-        cur.execute("SELECT value FROM osm2pgsql_properties WHERE property = 'db_format'")
-        row = cur.fetchone()
-        if row is None or row['value'] == '1':
-            for r in context.table:
-                last_node = 0
-                last_way = 0
-                parts = []
-                if r['members']:
-                    members = []
-                    for m in r['members'].split(','):
-                        mid = NominatimID(m)
-                        if mid.typ == 'N':
-                            parts.insert(last_node, int(mid.oid))
-                            last_node += 1
-                            last_way += 1
-                        elif mid.typ == 'W':
-                            parts.insert(last_way, int(mid.oid))
-                            last_way += 1
-                        else:
-                            parts.append(int(mid.oid))
-
-                        members.extend((mid.typ.lower() + mid.oid, mid.cls or ''))
-                else:
-                    members = None
-
-                tags = chain.from_iterable([(h[5:], r[h]) for h in r.headings if h.startswith("tags+")])
-
-                cur.execute("""INSERT INTO planet_osm_rels (id, way_off, rel_off, parts, members, tags)
-                               VALUES (%s, %s, %s, %s, %s, %s)""",
-                            (r['id'], last_node, last_way, parts, members, list(tags)))
-        else:
-            for r in context.table:
-                if r['members']:
-                    members = []
-                    for m in r['members'].split(','):
-                        mid = NominatimID(m)
-                        members.append({'ref': mid.oid, 'role': mid.cls or '', 'type': mid.typ})
-                else:
-                    members = []
-
-                tags = {h[5:]: r[h] for h in r.headings if h.startswith("tags+")}
-
-                cur.execute("""INSERT INTO planet_osm_rels (id, tags, members)
-                               VALUES (%s, %s, %s)""",
-                            (r['id'], psycopg.types.json.Json(tags),
-                             psycopg.types.json.Json(members)))
-
-@given("the ways")
-def add_data_to_planet_ways(context):
-    """ Add entries into the osm2pgsql way middle table. This is necessary for
-        tests on that that looks up node ids in this table.
-    """
-    with context.db.cursor() as cur:
-        cur.execute("SELECT value FROM osm2pgsql_properties WHERE property = 'db_format'")
-        row = cur.fetchone()
-        json_tags = row is not None and row['value'] != '1'
-        for r in context.table:
-            if json_tags:
-                tags = psycopg.types.json.Json({h[5:]: r[h] for h in r.headings if h.startswith("tags+")})
-            else:
-                tags = list(chain.from_iterable([(h[5:], r[h])
-                                                 for h in r.headings if h.startswith("tags+")]))
-            nodes = [ int(x.strip()) for x in r['nodes'].split(',') ]
-
-            cur.execute("INSERT INTO planet_osm_ways (id, nodes, tags) VALUES (%s, %s, %s)",
-                        (r['id'], nodes, tags))
-
-################################ WHEN ##################################
-
-@when("importing")
-def import_and_index_data_from_place_table(context):
-    """ Import data previously set up in the place table.
-    """
-    context.nominatim.run_nominatim('import', '--continue', 'load-data',
-                                              '--index-noanalyse', '-q',
-                                              '--offline')
-
-    check_database_integrity(context)
-
-    # Remove the output of the input, when all was right. Otherwise it will be
-    # output when there are errors that had nothing to do with the import
-    # itself.
-    context.log_capture.buffer.clear()
-
-@when("updating places")
-def update_place_table(context):
-    """ Update the place table with the given data. Also runs all triggers
-        related to updates and reindexes the new data.
-    """
-    context.nominatim.run_nominatim('refresh', '--functions')
-    with context.db.cursor() as cur:
-        for row in context.table:
-            col = PlaceColumn(context).add_row(row, False)
-            col.db_delete(cur)
-            col.db_insert(cur)
-        cur.execute('SELECT flush_deleted_places()')
-
-    context.nominatim.reindex_placex(context.db)
-    check_database_integrity(context)
-
-    # Remove the output of the input, when all was right. Otherwise it will be
-    # output when there are errors that had nothing to do with the import
-    # itself.
-    context.log_capture.buffer.clear()
-
-
-@when("updating postcodes")
-def update_postcodes(context):
-    """ Rerun the calculation of postcodes.
-    """
-    context.nominatim.run_nominatim('refresh', '--postcodes')
-
-@when("marking for delete (?P<oids>.*)")
-def delete_places(context, oids):
-    """ Remove entries from the place table. Multiple ids may be given
-        separated by commas. Also runs all triggers
-        related to updates and reindexes the new data.
-    """
-    context.nominatim.run_nominatim('refresh', '--functions')
-    with context.db.cursor() as cur:
-        cur.execute('TRUNCATE place_to_be_deleted')
-        for oid in oids.split(','):
-            NominatimID(oid).query_osm_id(cur, 'DELETE FROM place WHERE {}')
-        cur.execute('SELECT flush_deleted_places()')
-
-    context.nominatim.reindex_placex(context.db)
-
-    # Remove the output of the input, when all was right. Otherwise it will be
-    # output when there are errors that had nothing to do with the import
-    # itself.
-    context.log_capture.buffer.clear()
-
-################################ THEN ##################################
-
-@then("(?P<table>placex|place) contains(?P<exact> exactly)?")
-def check_place_contents(context, table, exact):
-    """ Check contents of place/placex tables. Each row represents a table row
-        and all data must match. Data not present in the expected table, may
-        be arbitrary. The rows are identified via the 'object' column which must
-        have an identifier of the form '<NRW><osm id>[:<class>]'. When multiple
-        rows match (for example because 'class' was left out and there are
-        multiple entries for the given OSM object) then all must match. All
-        expected rows are expected to be present with at least one database row.
-        When 'exactly' is given, there must not be additional rows in the database.
-    """
-    with context.db.cursor() as cur:
-        expected_content = set()
-        for row in context.table:
-            nid = NominatimID(row['object'])
-            query = 'SELECT *, ST_AsText(geometry) as geomtxt, ST_GeometryType(geometry) as geometrytype'
-            if table == 'placex':
-                query += ' ,ST_X(centroid) as cx, ST_Y(centroid) as cy'
-            query += " FROM %s WHERE {}" % (table, )
-            nid.query_osm_id(cur, query)
-            assert cur.rowcount > 0, "No rows found for " + row['object']
-
-            for res in cur:
-                if exact:
-                    expected_content.add((res['osm_type'], res['osm_id'], res['class']))
-
-                DBRow(nid, res, context).assert_row(row, ['object'])
-
-        if exact:
-            cur.execute(pysql.SQL('SELECT osm_type, osm_id, class from')
-                        + pysql.Identifier(table))
-            actual = set([(r['osm_type'], r['osm_id'], r['class']) for r in cur])
-            assert expected_content == actual, \
-                   f"Missing entries: {expected_content - actual}\n" \
-                   f"Not expected in table: {actual - expected_content}"
-
-
-@then("(?P<table>placex|place) has no entry for (?P<oid>.*)")
-def check_place_has_entry(context, table, oid):
-    """ Ensure that no database row for the given object exists. The ID
-        must be of the form '<NRW><osm id>[:<class>]'.
-    """
-    with context.db.cursor() as cur:
-        NominatimID(oid).query_osm_id(cur, "SELECT * FROM %s where {}" % table)
-        assert cur.rowcount == 0, \
-               "Found {} entries for ID {}".format(cur.rowcount, oid)
-
-
-@then("search_name contains(?P<exclude> not)?")
-def check_search_name_contents(context, exclude):
-    """ Check contents of place/placex tables. Each row represents a table row
-        and all data must match. Data not present in the expected table, may
-        be arbitrary. The rows are identified via the 'object' column which must
-        have an identifier of the form '<NRW><osm id>[:<class>]'. All
-        expected rows are expected to be present with at least one database row.
-    """
-    tokenizer = tokenizer_factory.get_tokenizer_for_db(context.nominatim.get_test_config())
-
-    with tokenizer.name_analyzer() as analyzer:
-        with context.db.cursor() as cur:
-            for row in context.table:
-                nid = NominatimID(row['object'])
-                nid.row_by_place_id(cur, 'search_name',
-                                    ['ST_X(centroid) as cx', 'ST_Y(centroid) as cy'])
-                assert cur.rowcount > 0, "No rows found for " + row['object']
-
-                for res in cur:
-                    db_row = DBRow(nid, res, context)
-                    for name, value in zip(row.headings, row.cells):
-                        if name in ('name_vector', 'nameaddress_vector'):
-                            items = [x.strip() for x in value.split(',')]
-                            tokens = analyzer.get_word_token_info(items)
-
-                            if not exclude:
-                                assert len(tokens) >= len(items), \
-                                       "No word entry found for {}. Entries found: {!s}".format(value, len(tokens))
-                            for word, token, wid in tokens:
-                                if exclude:
-                                    assert wid not in res[name], \
-                                           "Found term for {}/{}: {}".format(nid, name, wid)
-                                else:
-                                    assert wid in res[name], \
-                                           "Missing term for {}/{}: {}".format(nid, name, wid)
-                        elif name != 'object':
-                            assert db_row.contains(name, value), db_row.assert_msg(name, value)
-
-@then("search_name has no entry for (?P<oid>.*)")
-def check_search_name_has_entry(context, oid):
-    """ Check that there is noentry in the search_name table for the given
-        objects. IDs are in format '<NRW><osm id>[:<class>]'.
-    """
-    with context.db.cursor() as cur:
-        NominatimID(oid).row_by_place_id(cur, 'search_name')
-
-        assert cur.rowcount == 0, \
-               "Found {} entries for ID {}".format(cur.rowcount, oid)
-
-@then("location_postcode contains exactly")
-def check_location_postcode(context):
-    """ Check full contents for location_postcode table. Each row represents a table row
-        and all data must match. Data not present in the expected table, may
-        be arbitrary. The rows are identified via 'country' and 'postcode' columns.
-        All rows must be present as excepted and there must not be additional
-        rows.
-    """
-    with context.db.cursor() as cur:
-        cur.execute("SELECT *, ST_AsText(geometry) as geomtxt FROM location_postcode")
-        assert cur.rowcount == len(list(context.table)), \
-            "Postcode table has {} rows, expected {}.".format(cur.rowcount, len(list(context.table)))
-
-        results = {}
-        for row in cur:
-            key = (row['country_code'], row['postcode'])
-            assert key not in results, "Postcode table has duplicate entry: {}".format(row)
-            results[key] = DBRow((row['country_code'],row['postcode']), row, context)
-
-        for row in context.table:
-            db_row = results.get((row['country'],row['postcode']))
-            assert db_row is not None, \
-                f"Missing row for country '{row['country']}' postcode '{row['postcode']}'."
-
-            db_row.assert_row(row, ('country', 'postcode'))
-
-@then("there are(?P<exclude> no)? word tokens for postcodes (?P<postcodes>.*)")
-def check_word_table_for_postcodes(context, exclude, postcodes):
-    """ Check that the tokenizer produces postcode tokens for the given
-        postcodes. The postcodes are a comma-separated list of postcodes.
-        Whitespace matters.
-    """
-    nctx = context.nominatim
-    tokenizer = tokenizer_factory.get_tokenizer_for_db(nctx.get_test_config())
-    with tokenizer.name_analyzer() as ana:
-        plist = [ana.normalize_postcode(p) for p in postcodes.split(',')]
-
-    plist.sort()
-
-    with context.db.cursor() as cur:
-        cur.execute("SELECT word FROM word WHERE type = 'P' and word = any(%s)",
-                    (plist,))
-
-        found = [row['word'] for row in cur]
-        assert len(found) == len(set(found)), f"Duplicate rows for postcodes: {found}"
-
-    if exclude:
-        assert len(found) == 0, f"Unexpected postcodes: {found}"
-    else:
-        assert set(found) == set(plist), \
-        f"Missing postcodes {set(plist) - set(found)}. Found: {found}"
-
-@then("place_addressline contains")
-def check_place_addressline(context):
-    """ Check the contents of the place_addressline table. Each row represents
-        a table row and all data must match. Data not present in the expected
-        table, may be arbitrary. The rows are identified via the 'object' column,
-        representing the addressee and the 'address' column, representing the
-        address item.
-    """
-    with context.db.cursor() as cur:
-        for row in context.table:
-            nid = NominatimID(row['object'])
-            pid = nid.get_place_id(cur)
-            apid = NominatimID(row['address']).get_place_id(cur)
-            cur.execute(""" SELECT * FROM place_addressline
-                            WHERE place_id = %s AND address_place_id = %s""",
-                        (pid, apid))
-            assert cur.rowcount > 0, \
-                        "No rows found for place %s and address %s" % (row['object'], row['address'])
-
-            for res in cur:
-                DBRow(nid, res, context).assert_row(row, ('address', 'object'))
-
-@then("place_addressline doesn't contain")
-def check_place_addressline_exclude(context):
-    """ Check that the place_addressline doesn't contain any entries for the
-        given addressee/address item pairs.
-    """
-    with context.db.cursor() as cur:
-        for row in context.table:
-            pid = NominatimID(row['object']).get_place_id(cur)
-            apid = NominatimID(row['address']).get_place_id(cur, allow_empty=True)
-            if apid is not None:
-                cur.execute(""" SELECT * FROM place_addressline
-                                WHERE place_id = %s AND address_place_id = %s""",
-                            (pid, apid))
-                assert cur.rowcount == 0, \
-                    "Row found for place %s and address %s" % (row['object'], row['address'])
-
-@then("W(?P<oid>\d+) expands to(?P<neg> no)? interpolation")
-def check_location_property_osmline(context, oid, neg):
-    """ Check that the given way is present in the interpolation table.
-    """
-    with context.db.cursor() as cur:
-        cur.execute("""SELECT *, ST_AsText(linegeo) as geomtxt
-                       FROM location_property_osmline
-                       WHERE osm_id = %s AND startnumber IS NOT NULL""",
-                    (oid, ))
-
-        if neg:
-            assert cur.rowcount == 0, "Interpolation found for way {}.".format(oid)
-            return
-
-        todo = list(range(len(list(context.table))))
-        for res in cur:
-            for i in todo:
-                row = context.table[i]
-                if (int(row['start']) == res['startnumber']
-                    and int(row['end']) == res['endnumber']):
-                    todo.remove(i)
-                    break
-            else:
-                assert False, "Unexpected row " + str(res)
-
-            DBRow(oid, res, context).assert_row(row, ('start', 'end'))
-
-        assert not todo, f"Unmatched lines in table: {list(context.table[i] for i in todo)}"
-
-@then("location_property_osmline contains(?P<exact> exactly)?")
-def check_place_contents(context, exact):
-    """ Check contents of the interpolation table. Each row represents a table row
-        and all data must match. Data not present in the expected table, may
-        be arbitrary. The rows are identified via the 'object' column which must
-        have an identifier of the form '<osm id>[:<startnumber>]'. When multiple
-        rows match (for example because 'startnumber' was left out and there are
-        multiple entries for the given OSM object) then all must match. All
-        expected rows are expected to be present with at least one database row.
-        When 'exactly' is given, there must not be additional rows in the database.
-    """
-    with context.db.cursor() as cur:
-        expected_content = set()
-        for row in context.table:
-            if ':' in row['object']:
-                nid, start = row['object'].split(':', 2)
-                start = int(start)
-            else:
-                nid, start = row['object'], None
-
-            query = """SELECT *, ST_AsText(linegeo) as geomtxt,
-                              ST_GeometryType(linegeo) as geometrytype
-                       FROM location_property_osmline WHERE osm_id=%s"""
-
-            if ':' in row['object']:
-                query += ' and startnumber = %s'
-                params = [int(val) for val in row['object'].split(':', 2)]
-            else:
-                params = (int(row['object']), )
-
-            cur.execute(query, params)
-            assert cur.rowcount > 0, "No rows found for " + row['object']
-
-            for res in cur:
-                if exact:
-                    expected_content.add((res['osm_id'], res['startnumber']))
-
-                DBRow(nid, res, context).assert_row(row, ['object'])
-
-        if exact:
-            cur.execute('SELECT osm_id, startnumber from location_property_osmline')
-            actual = set([(r['osm_id'], r['startnumber']) for r in cur])
-            assert expected_content == actual, \
-                   f"Missing entries: {expected_content - actual}\n" \
-                   f"Not expected in table: {actual - expected_content}"
-
diff --git a/test/bdd/steps/steps_osm_data.py b/test/bdd/steps/steps_osm_data.py
deleted file mode 100644
index 4cee75f7..00000000
--- a/test/bdd/steps/steps_osm_data.py
+++ /dev/null
@@ -1,142 +0,0 @@
-# SPDX-License-Identifier: GPL-3.0-or-later
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2024 by the Nominatim developer community.
-# For a full list of authors see the git log.
-import tempfile
-import random
-import os
-from pathlib import Path
-
-from nominatim_db.tools.exec_utils import run_osm2pgsql
-from nominatim_db.tools.replication import run_osm2pgsql_updates
-
-from geometry_alias import ALIASES
-
-def get_osm2pgsql_options(nominatim_env, fname, append):
-    return dict(import_file=fname,
-                osm2pgsql='osm2pgsql',
-                osm2pgsql_cache=50,
-                osm2pgsql_style=str(nominatim_env.get_test_config().get_import_style_file()),
-                osm2pgsql_style_path=nominatim_env.get_test_config().config_dir,
-                threads=1,
-                dsn=nominatim_env.get_libpq_dsn(),
-                flatnode_file='',
-                tablespaces=dict(slim_data='', slim_index='',
-                                 main_data='', main_index=''),
-                append=append
-               )
-
-
-def write_opl_file(opl, grid):
-    """ Create a temporary OSM file from OPL and return the file name. It is
-        the responsibility of the caller to delete the file again.
-
-        Node with missing coordinates, can retrieve their coordinates from
-        a supplied grid. Failing that a random coordinate is assigned.
-    """
-    with tempfile.NamedTemporaryFile(suffix='.opl', delete=False) as fd:
-        for line in opl.splitlines():
-            if line.startswith('n') and line.find(' x') < 0:
-                coord = grid.grid_node(int(line[1:].split(' ')[0]))
-                if coord is None:
-                    coord = (random.random() * 360 - 180,
-                             random.random() * 180 - 90)
-                line += " x%f y%f" % coord
-            fd.write(line.encode('utf-8'))
-            fd.write(b'\n')
-
-        return fd.name
-
-@given('the lua style file')
-def lua_style_file(context):
-    """ Define a custom style file to use for the import.
-    """
-    style = Path(context.nominatim.website_dir.name) / 'custom.lua'
-    style.write_text(context.text)
-    context.nominatim.test_env['NOMINATIM_IMPORT_STYLE'] = str(style)
-
-
-@given(u'the ([0-9.]+ )?grid(?: with origin (?P<origin>.*))?')
-def define_node_grid(context, grid_step, origin):
-    """
-    Define a grid of node positions.
-    Use a table to define the grid. The nodes must be integer ids. Optionally
-    you can give the grid distance. The default is 0.00001 degrees.
-    """
-    if grid_step is not None:
-        grid_step = float(grid_step.strip())
-    else:
-        grid_step = 0.00001
-
-    if origin:
-        if ',' in origin:
-            # TODO coordinate
-            coords = origin.split(',')
-            if len(coords) != 2:
-                raise RuntimeError('Grid origin expects origin with x,y coordinates.')
-            origin = (float(coords[0]), float(coords[1]))
-        elif origin in ALIASES:
-            origin = ALIASES[origin]
-        else:
-            raise RuntimeError('Grid origin must be either coordinate or alias.')
-    else:
-        origin = (0.0, 0.0)
-
-    context.osm.set_grid([context.table.headings] + [list(h) for h in context.table],
-                         grid_step, origin)
-
-
-@when(u'loading osm data')
-def load_osm_file(context):
-    """
-    Load the given data into a freshly created test data using osm2pgsql.
-    No further indexing is done.
-
-    The data is expected as attached text in OPL format.
-    """
-    # create an OSM file and import it
-    fname = write_opl_file(context.text, context.osm)
-    try:
-        run_osm2pgsql(get_osm2pgsql_options(context.nominatim, fname, append=False))
-    finally:
-        os.remove(fname)
-
-    ### reintroduce the triggers/indexes we've lost by having osm2pgsql set up place again
-    cur = context.db.cursor()
-    cur.execute("""CREATE TRIGGER place_before_delete BEFORE DELETE ON place
-                    FOR EACH ROW EXECUTE PROCEDURE place_delete()""")
-    cur.execute("""CREATE TRIGGER place_before_insert BEFORE INSERT ON place
-                   FOR EACH ROW EXECUTE PROCEDURE place_insert()""")
-    cur.execute("""CREATE UNIQUE INDEX idx_place_osm_unique on place using btree(osm_id,osm_type,class,type)""")
-    context.db.commit()
-
-
-@when(u'updating osm data')
-def update_from_osm_file(context):
-    """
-    Update a database previously populated with 'loading osm data'.
-    Needs to run indexing on the existing data first to yield the correct result.
-
-    The data is expected as attached text in OPL format.
-    """
-    context.nominatim.copy_from_place(context.db)
-    context.nominatim.run_nominatim('index')
-    context.nominatim.run_nominatim('refresh', '--functions')
-
-    # create an OSM file and import it
-    fname = write_opl_file(context.text, context.osm)
-    try:
-        run_osm2pgsql_updates(context.db,
-                              get_osm2pgsql_options(context.nominatim, fname, append=True))
-    finally:
-        os.remove(fname)
-
-@when('indexing')
-def index_database(context):
-    """
-    Run the Nominatim indexing step. This will process data previously
-    loaded with 'updating osm data'
-    """
-    context.nominatim.run_nominatim('index')
diff --git a/test/bdd/steps/table_compare.py b/test/bdd/steps/table_compare.py
deleted file mode 100644
index 4284fad9..00000000
--- a/test/bdd/steps/table_compare.py
+++ /dev/null
@@ -1,227 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2022 by the Nominatim developer community.
-# For a full list of authors see the git log.
-"""
-Functions to facilitate accessing and comparing the content of DB tables.
-"""
-import re
-import json
-
-import psycopg
-from psycopg import sql as pysql
-
-from steps.check_functions import Almost
-
-ID_REGEX = re.compile(r"(?P<typ>[NRW])(?P<oid>\d+)(:(?P<cls>\w+))?")
-
-class NominatimID:
-    """ Splits a unique identifier for places into its components.
-        As place_ids cannot be used for testing, we use a unique
-        identifier instead that is of the form <osmtype><osmid>[:<class>].
-    """
-
-    def __init__(self, oid):
-        self.typ = self.oid = self.cls = None
-
-        if oid is not None:
-            m = ID_REGEX.fullmatch(oid)
-            assert m is not None, \
-                   "ID '{}' not of form <osmtype><osmid>[:<class>]".format(oid)
-
-            self.typ = m.group('typ')
-            self.oid = m.group('oid')
-            self.cls = m.group('cls')
-
-    def __str__(self):
-        if self.cls is None:
-            return self.typ + self.oid
-
-        return '{self.typ}{self.oid}:{self.cls}'.format(self=self)
-
-    def query_osm_id(self, cur, query):
-        """ Run a query on cursor `cur` using osm ID, type and class. The
-            `query` string must contain exactly one placeholder '{}' where
-            the 'where' query should go.
-        """
-        where = 'osm_type = %s and osm_id = %s'
-        params = [self.typ, self. oid]
-
-        if self.cls is not None:
-            where += ' and class = %s'
-            params.append(self.cls)
-
-        cur.execute(query.format(where), params)
-
-    def row_by_place_id(self, cur, table, extra_columns=None):
-        """ Get a row by place_id from the given table using cursor `cur`.
-            extra_columns may contain a list additional elements for the select
-            part of the query.
-        """
-        pid = self.get_place_id(cur)
-        query = "SELECT {} FROM {} WHERE place_id = %s".format(
-                    ','.join(['*'] + (extra_columns or [])), table)
-        cur.execute(query, (pid, ))
-
-    def get_place_id(self, cur, allow_empty=False):
-        """ Look up the place id for the ID. Throws an assertion if the ID
-            is not unique.
-        """
-        self.query_osm_id(cur, "SELECT place_id FROM placex WHERE {}")
-        if cur.rowcount == 0 and allow_empty:
-            return None
-
-        assert cur.rowcount == 1, \
-               "Place ID {!s} not unique. Found {} entries.".format(self, cur.rowcount)
-
-        return cur.fetchone()['place_id']
-
-
-class DBRow:
-    """ Represents a row from a database and offers comparison functions.
-    """
-    def __init__(self, nid, db_row, context):
-        self.nid = nid
-        self.db_row = db_row
-        self.context = context
-
-    def assert_row(self, row, exclude_columns):
-        """ Check that all columns of the given behave row are contained
-            in the database row. Exclude behave rows with the names given
-            in the `exclude_columns` list.
-        """
-        for name, value in zip(row.headings, row.cells):
-            if name not in exclude_columns:
-                assert self.contains(name, value), self.assert_msg(name, value)
-
-    def contains(self, name, expected):
-        """ Check that the DB row contains a column `name` with the given value.
-        """
-        if '+' in name:
-            column, field = name.split('+', 1)
-            return self._contains_hstore_value(column, field, expected)
-
-        if name == 'geometry':
-            return self._has_geometry(expected)
-
-        if name not in self.db_row:
-            return False
-
-        actual = self.db_row[name]
-
-        if expected == '-':
-            return actual is None
-
-        if name == 'name' and ':' not in expected:
-            return self._compare_column(actual[name], expected)
-
-        if 'place_id' in name:
-            return self._compare_place_id(actual, expected)
-
-        if name == 'centroid':
-            return self._has_centroid(expected)
-
-        return self._compare_column(actual, expected)
-
-    def _contains_hstore_value(self, column, field, expected):
-        if column == 'addr':
-            column = 'address'
-
-        if column not in self.db_row:
-            return False
-
-        if expected == '-':
-            return self.db_row[column] is None or field not in self.db_row[column]
-
-        if self.db_row[column] is None:
-            return False
-
-        return self._compare_column(self.db_row[column].get(field), expected)
-
-    def _compare_column(self, actual, expected):
-        if isinstance(actual, dict):
-            return actual == eval('{' + expected + '}')
-
-        return str(actual) == expected
-
-    def _compare_place_id(self, actual, expected):
-       if expected == '0':
-            return actual == 0
-
-       with self.context.db.cursor() as cur:
-            return NominatimID(expected).get_place_id(cur) == actual
-
-    def _has_centroid(self, expected):
-        if expected == 'in geometry':
-            with self.context.db.cursor(row_factory=psycopg.rows.tuple_row) as cur:
-                cur.execute("""SELECT ST_Within(ST_SetSRID(ST_Point(%(cx)s, %(cy)s), 4326),
-                                        ST_SetSRID(%(geomtxt)s::geometry, 4326))""",
-                            (self.db_row))
-                return cur.fetchone()[0]
-
-        if ' ' in expected:
-            x, y = expected.split(' ')
-        else:
-            x, y = self.context.osm.grid_node(int(expected))
-
-        return Almost(float(x)) == self.db_row['cx'] and Almost(float(y)) == self.db_row['cy']
-
-    def _has_geometry(self, expected):
-        geom = self.context.osm.parse_geometry(expected)
-        with self.context.db.cursor(row_factory=psycopg.rows.tuple_row) as cur:
-            cur.execute(pysql.SQL("""SELECT ST_Equals(ST_SnapToGrid({}, 0.00001, 0.00001),
-                                   ST_SnapToGrid(ST_SetSRID({}::geometry, 4326), 0.00001, 0.00001))""")
-                             .format(pysql.SQL(geom),
-                                     pysql.Literal(self.db_row['geomtxt'])))
-            return cur.fetchone()[0]
-
-    def assert_msg(self, name, value):
-        """ Return a string with an informative message for a failed compare.
-        """
-        msg = "\nBad column '{}' in row '{!s}'.".format(name, self.nid)
-        actual = self._get_actual(name)
-        if actual is not None:
-            msg += " Expected: {}, got: {}.".format(value, actual)
-        else:
-            msg += " No such column."
-
-        return msg + "\nFull DB row: {}".format(json.dumps(dict(self.db_row), indent=4, default=str))
-
-    def _get_actual(self, name):
-        if '+' in name:
-            column, field = name.split('+', 1)
-            if column == 'addr':
-                column = 'address'
-            return (self.db_row.get(column) or {}).get(field)
-
-        if name == 'geometry':
-            return self.db_row['geomtxt']
-
-        if name not in self.db_row:
-            return None
-
-        if name == 'centroid':
-            return "POINT({cx} {cy})".format(**self.db_row)
-
-        actual = self.db_row[name]
-
-        if 'place_id' in name:
-            if actual is None:
-                return '<null>'
-
-            if actual == 0:
-                return "place ID 0"
-
-            with self.context.db.cursor(row_factory=psycopg.rows.tuple_row) as cur:
-                cur.execute("""SELECT osm_type, osm_id, class
-                               FROM placex WHERE place_id = %s""",
-                            (actual, ))
-
-                if cur.rowcount == 1:
-                    return "{0[0]}{0[1]}:{0[2]}".format(cur.fetchone())
-
-                return "[place ID {} not found]".format(actual)
-
-        return actual
diff --git a/test/bdd/steps/utils.py b/test/bdd/steps/utils.py
deleted file mode 100644
index e789deff..00000000
--- a/test/bdd/steps/utils.py
+++ /dev/null
@@ -1,28 +0,0 @@
-# SPDX-License-Identifier: GPL-2.0-only
-#
-# This file is part of Nominatim. (https://nominatim.org)
-#
-# Copyright (C) 2022 by the Nominatim developer community.
-# For a full list of authors see the git log.
-"""
-Various smaller helps for step execution.
-"""
-import logging
-import subprocess
-
-LOG = logging.getLogger(__name__)
-
-def run_script(cmd, **kwargs):
-    """ Run the given command, check that it is successful and output
-        when necessary.
-    """
-    proc = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE,
-                            **kwargs)
-    (outp, outerr) = proc.communicate()
-    outp = outp.decode('utf-8')
-    outerr = outerr.decode('utf-8').replace('\\n', '\n')
-    LOG.debug("Run command: %s\n%s\n%s", cmd, outp, outerr)
-
-    assert proc.returncode == 0, "Script '{}' failed:\n{}\n{}\n".format(cmd[0], outp, outerr)
-
-    return outp, outerr
diff --git a/test/bdd/test_api.py b/test/bdd/test_api.py
new file mode 100644
index 00000000..5ace7b94
--- /dev/null
+++ b/test/bdd/test_api.py
@@ -0,0 +1,153 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Collector for all BDD API tests.
+
+These tests work on a static test database that is the same for all tests.
+The source data for the database can be found in the test/testdb directory.
+"""
+from pathlib import Path
+import xml.etree.ElementTree as ET
+
+import pytest
+from pytest_bdd.parsers import re as step_parse
+from pytest_bdd import scenarios, when, given, then
+
+from nominatim_db import cli
+from nominatim_db.config import Configuration
+
+from utils.db import DBManager
+from utils.api_runner import APIRunner
+from utils.api_result import APIResult
+
+
+TESTDB_PATH = (Path(__file__) / '..' / '..' / 'testdb').resolve()  # i.e. test/testdb
+
+CONTENT_TYPES = {  # expected 'content-type' response header per output format
+    'json': 'application/json; charset=utf-8',
+    'xml': 'text/xml; charset=utf-8',
+    'geojson': 'application/json; charset=utf-8',
+    'geocodejson': 'application/json; charset=utf-8',
+    'html': 'text/html; charset=utf-8'
+}
+
+
+@pytest.fixture(autouse=True, scope='session')
+def session_api_test_db(pytestconfig):
+    """ Session-wide setup of the API test database from the data in
+        test/testdb. An existing database is only recreated when
+        --nominatim-purge was set. A failed import drops the database.
+    """
+    dbname = pytestconfig.getini('nominatim_api_test_db')
+    tokenizer = pytestconfig.option.NOMINATIM_TOKENIZER
+
+    env = Configuration(None).get_os_env()
+    env['NOMINATIM_DATABASE_DSN'] = f"pgsql:dbname={dbname}"
+    env['NOMINATIM_LANGUAGES'] = 'en,de,fr,ja'
+    env['NOMINATIM_USE_US_TIGER_DATA'] = 'yes'
+    if tokenizer is not None:
+        env['NOMINATIM_TOKENIZER'] = tokenizer
+
+    dbm = DBManager(purge=pytestconfig.option.NOMINATIM_PURGE)
+    if dbm.check_for_db(dbname):
+        return
+
+    project = ['--project-dir', str(TESTDB_PATH)]
+    steps = (
+        ['import', *project, '--osm-file', str(TESTDB_PATH / 'apidb-test-data.pbf')],
+        ['add-data', *project, '--tiger-data', str(TESTDB_PATH / 'tiger')],
+        ['freeze', *project],
+        ['special-phrases', *project, '--import-from-csv',
+         str(TESTDB_PATH / 'full_en_phrases_test.csv')],
+    )
+    try:
+        for args in steps:
+            cli.nominatim(cli_args=args, environ=env)
+    except:  # noqa: E722
+        dbm.drop_db(dbname)
+        raise
+
+
+@pytest.fixture
+def test_config_env(pytestconfig):
+    """ Environment settings pointing Nominatim at the 'nominatim_api_test_db' database. """
+    dbname = pytestconfig.getini('nominatim_api_test_db')
+    tokenizer = pytestconfig.option.NOMINATIM_TOKENIZER
+    env = Configuration(None).get_os_env()
+    env['NOMINATIM_DATABASE_DSN'] = f"pgsql:dbname={dbname}"
+    env['NOMINATIM_LANGUAGES'] = 'en,de,fr,ja'
+    env['NOMINATIM_USE_US_TIGER_DATA'] = 'yes'
+    if tokenizer is not None:
+        env['NOMINATIM_TOKENIZER'] = tokenizer
+    return env
+
+
+@pytest.fixture
+def api_http_request_headers():
+    return {}  # empty by default; the 'the HTTP header' step adds entries
+
+
+@given('the HTTP header', target_fixture='api_http_request_headers')
+def set_additional_http_headers(api_http_request_headers, datatable):
+    api_http_request_headers.update(zip(datatable[0], datatable[1]))  # row 0: names, row 1: values
+    return api_http_request_headers
+
+
+@given('an unknown database', target_fixture='test_config_env')
+def setup_connection_unknown_database(test_config_env):  # presumably no DB of that name exists
+    test_config_env['NOMINATIM_DATABASE_DSN'] = "pgsql:dbname=gerlkghngergn6732nf"
+    return test_config_env
+
+
+@when(step_parse(r'sending v1/(?P<endpoint>\S+)(?: with format (?P<fmt>\S+))?'),
+      target_fixture='api_response')
+def send_api_status(test_config_env, api_http_request_headers, pytestconfig,
+                    datatable, endpoint, fmt):  # fmt comes from the optional 'with format' part
+    runner = APIRunner(test_config_env, pytestconfig.option.NOMINATIM_API_ENGINE)
+    return runner.run_step(endpoint, {}, datatable, fmt, api_http_request_headers)
+
+
+@then(step_parse(r'a HTTP (?P<status>\d+) is returned'), converters={'status': int})
+def check_http_result(api_response, status):
+    assert api_response.status == status  # 'status' arrives as int via the converter
+
+
+@then(step_parse('the page content equals "(?P<content>.*)"'))
+def check_page_content_exact(api_response, content):
+    assert api_response.body == content  # plain equality on the whole body
+
+
+@then('the result is valid html')
+def check_for_html_correctness(api_response):
+    """ Check the content type and that the page parses as XML with an
+        <html> root and a <body> that contains no <script> element.
+    """
+    assert api_response.headers['content-type'] == CONTENT_TYPES['html']
+    page = api_response.body
+    try:
+        root = ET.fromstring(page)
+    except Exception as ex:
+        assert False, f"Could not parse page: {ex}\n{page}"
+    assert root.tag == 'html'
+    content = root.find('./body')
+    assert content is not None and content.find('.//script') is None
+
+
+@then(step_parse(r'the result is valid (?P<fmt>\S+)(?: with (?P<num>\d+) results?)?'),
+      target_fixture='nominatim_result')
+def parse_api_json_response(api_response, fmt, num):
+    """ Parse the response body as the given format and publish it as
+        'nominatim_result'. Optionally checks the number of results.
+    """
+    assert api_response.headers['content-type'] == CONTENT_TYPES[fmt]
+    parsed = APIResult(fmt, api_response.endpoint, api_response.body)
+    if num:
+        assert len(parsed) == int(num)
+    return parsed
+
+
+scenarios('features/api')
diff --git a/test/bdd/test_db.py b/test/bdd/test_db.py
new file mode 100644
index 00000000..01cec9e3
--- /dev/null
+++ b/test/bdd/test_db.py
@@ -0,0 +1,244 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Collector for BDD import acceptance tests.
+
+These tests check the Nominatim import chain after the osm2pgsql import.
+"""
+import asyncio
+import re
+
+import psycopg
+
+import pytest
+from pytest_bdd import scenarios, when, then, given
+from pytest_bdd.parsers import re as step_parse
+
+from utils.place_inserter import PlaceColumn
+from utils.checks import check_table_content
+
+from nominatim_db.config import Configuration
+from nominatim_db import cli
+from nominatim_db.tools.database_import import load_data, create_table_triggers
+from nominatim_db.tools.postcodes import update_postcodes
+from nominatim_db.tokenizer import factory as tokenizer_factory
+
+
+def _rewrite_placeid_field(field, new_field, datatable, place_ids):
+    """ Rename column 'field' and map its values to place IDs, '-' to None.
+    """
+    if field in datatable[0]:
+        col = datatable[0].index(field)
+        datatable[0][col] = new_field
+        for row in datatable[1:]:
+            row[col] = None if row[col] == '-' else place_ids[row[col]]
+
+
+def _collect_place_ids(conn):
+    """ Map '<type><id>' and '<type><id>:<class>' of all placex rows to place_id. """
+    lookup = {}
+    with conn.cursor() as cur:
+        cur.execute('SELECT place_id, osm_type, osm_id, class FROM placex')
+        for pid, otype, oid, cls in cur:
+            lookup[f"{otype}{oid}"] = lookup[f"{otype}{oid}:{cls}"] = pid
+    return lookup
+
+
+@pytest.fixture
+def test_config_env(pytestconfig):
+    """ Environment settings pointing Nominatim at the 'nominatim_test_db' database. """
+    dbname = pytestconfig.getini('nominatim_test_db')
+    tokenizer = pytestconfig.option.NOMINATIM_TOKENIZER
+    env = Configuration(None).get_os_env()
+    env['NOMINATIM_DATABASE_DSN'] = f"pgsql:dbname={dbname}"
+    env['NOMINATIM_LANGUAGES'] = 'en,de,fr,ja'
+    env['NOMINATIM_USE_US_TIGER_DATA'] = 'yes'
+    if tokenizer is not None:
+        env['NOMINATIM_TOKENIZER'] = tokenizer
+    return env
+
+
+@pytest.fixture
+def update_config(def_config):
+    """ Run 'refresh --functions' to make the database updatable; return the config.
+    """
+    cli.nominatim(['refresh', '--functions'], def_config.environ)
+
+    return def_config
+
+
+@given(step_parse('the (?P<named>named )?places'), target_fixture=None)
+def import_places(db_conn, named, datatable, node_grid):
+    """ Insert the table rows into the place table. With 'named' set,
+        a random name will be generated for all objects.
+    """
+    header, with_names = datatable[0], named is not None
+    with db_conn.cursor() as cur:
+        for row in datatable[1:]:
+            PlaceColumn(node_grid).add_row(header, row, with_names).db_insert(cur)
+
+
+@given('the ways', target_fixture=None)
+def import_ways(db_conn, datatable):
+    """ Import raw ways into the osm2pgsql way middle table.
+        Needs columns 'id' and 'nodes'; 'tags+<key>' columns become tags.
+    """
+    header = datatable[0]
+    id_col, nodes_col = header.index('id'), header.index('nodes')
+    sql = "INSERT INTO planet_osm_ways (id, nodes, tags) VALUES (%s, %s, %s)"
+
+    with db_conn.cursor() as cur:
+        for row in datatable[1:]:
+            tagdict = {key[5:]: value for key, value in zip(header, row)
+                       if key.startswith("tags+")}
+            node_ids = [int(ref) for ref in row[nodes_col].split(',')]
+            cur.execute(sql, (row[id_col], node_ids, psycopg.types.json.Json(tagdict)))
+
+
+@given('the relations', target_fixture=None)
+def import_rels(db_conn, datatable):
+    """ Import raw relations into the osm2pgsql relation middle table.
+        Members are a comma-separated list of '<R|W|N><id>[:<role>]'.
+    """
+    header = datatable[0]
+    id_col, memb_col = header.index('id'), header.index('members')
+    sql = 'INSERT INTO planet_osm_rels (id, tags, members) VALUES (%s, %s, %s)'
+    member_re = re.compile(r'\s*([RWN])(\d+)(?::(\S+))?\s*')
+    with db_conn.cursor() as cur:
+        for row in datatable[1:]:
+            tagdict = {key[5:]: value for key, value in zip(header, row)
+                       if key.startswith("tags+")}
+            members = []
+            for member in (row[memb_col].split(',') if row[memb_col] else []):
+                m = member_re.fullmatch(member)
+                if not m:
+                    raise ValueError(f'Illegal member {member}.')
+                members.append({'ref': int(m[2]), 'role': m[3] or '', 'type': m[1]})
+            cur.execute(sql, (int(row[id_col]), psycopg.types.json.Json(tagdict),
+                              psycopg.types.json.Json(members)))
+
+
+@when('importing', target_fixture='place_ids')
+def do_import(db_conn, def_config):
+    """ Run a reduced version of the Nominatim import; returns the place ID lookup.
+    """
+    create_table_triggers(db_conn, def_config)
+    asyncio.run(load_data(def_config.get_libpq_dsn(), 1))  # 1: presumably thread count - confirm
+    tokenizer = tokenizer_factory.get_tokenizer_for_db(def_config)
+    update_postcodes(def_config.get_libpq_dsn(), None, tokenizer)
+    cli.nominatim(['index', '-q'], def_config.environ)
+
+    return _collect_place_ids(db_conn)
+
+
+@when('updating places', target_fixture='place_ids')
+def do_update(db_conn, update_config, node_grid, datatable):
+    """ Update the place table with the given data. Also runs all triggers
+        related to updates and reindexes the new data.
+    """
+    with db_conn.cursor() as cur:
+        for row in datatable[1:]:  # datatable[0] holds the column names
+            PlaceColumn(node_grid).add_row(datatable[0], row, False).db_insert(cur)
+        cur.execute('SELECT flush_deleted_places()')
+    db_conn.commit()  # presumably so that the indexer run below sees the changes
+
+    cli.nominatim(['index', '-q'], update_config.environ)
+
+    return _collect_place_ids(db_conn)  # refreshed lookup, published as 'place_ids'
+
+
+@when('updating postcodes')
+def do_postcode_update(update_config):
+    """ Recompute the postcode centroids ('nominatim refresh --postcodes').
+    """
+    cli.nominatim(['refresh', '--postcodes'], update_config.environ)
+
+
+@when(step_parse(r'marking for delete (?P<otype>[NRW])(?P<oid>\d+)'),
+      converters={'oid': int})
+def do_delete_place(db_conn, update_config, node_grid, otype, oid):
+    """ Remove the given place from the database.
+    """
+    with db_conn.cursor() as cur:
+        cur.execute('TRUNCATE place_to_be_deleted')  # empty the table before the delete
+        cur.execute('DELETE FROM place WHERE osm_type = %s and osm_id = %s',
+                    (otype, oid))
+        cur.execute('SELECT flush_deleted_places()')
+    db_conn.commit()
+
+    cli.nominatim(['index', '-q'], update_config.environ)  # reindex after the deletion
+
+
+@then(step_parse(r'(?P<table>\w+) contains(?P<exact> exactly)?'))
+def then_check_table_content(db_conn, place_ids, datatable, node_grid, table, exact):
+    """ Compare a table with the data table after mapping OSM object
+        references to place IDs and 'addr+' columns to 'address+'.
+    """
+    renames = [('object', 'place_id'), ('parent_place_id', 'parent_place_id'),
+               ('linked_place_id', 'linked_place_id')]
+    if table == 'place_addressline':
+        renames.append(('address', 'address_place_id'))
+    for old, new in renames:
+        _rewrite_placeid_field(old, new, datatable, place_ids)
+    datatable[0][:] = [f"address+{t[5:]}" if t.startswith('addr+') else t for t in datatable[0]]
+    check_table_content(db_conn, table, datatable, grid=node_grid, exact=bool(exact))
+
+
+@then(step_parse(r'(DISABLED?P<table>placex?) has no entry for (?P<oid>[NRW]\d+(?::\S+)?)'))
+def then_check_place_missing_lines(db_conn, place_ids, table, oid):  # NOTE: pattern is DISABLED
+    """ Assert that the given table has no row for the place ID of the OSM object. """
+    from psycopg import sql as pysql
+    from psycopg.rows import tuple_row
+    assert oid in place_ids
+    sql = pysql.SQL("SELECT count(*) FROM {} WHERE place_id = %s").format(pysql.Identifier(table))
+    with db_conn.cursor(row_factory=tuple_row) as cur:
+        assert cur.execute(sql, [place_ids[oid]]).fetchone()[0] == 0
+
+
+@then(step_parse(r'W(?P<oid>\d+) expands to interpolation'),
+      converters={'oid': int})
+def then_check_interpolation_table(db_conn, node_grid, place_ids, oid, datatable):
+    """ Check the rows of location_property_osmline for way 'oid'.
+
+        The number of rows must equal the number of data lines in the
+        table. The optional columns 'start', 'end' and 'geometry' are
+        compared as 'startnumber', 'endnumber' and 'linegeo!wkt'.
+    """
+    with db_conn.cursor() as cur:
+        cur.execute('SELECT count(*) FROM location_property_osmline WHERE osm_id = %s',
+                    [oid])
+        assert cur.fetchone()[0] == len(datatable) - 1
+
+    # Map the optional input columns to the column names used for the
+    # comparison, always in the order start, end, geometry.
+    header = datatable[0]
+    columns = [(header.index(name), target)
+               for name, target in (('start', 'startnumber'), ('end', 'endnumber'),
+                                    ('geometry', 'linegeo!wkt'))
+               if name in header]
+
+    converted = [['osm_id'] + [target for _, target in columns]]
+    for line in datatable[1:]:
+        converted.append([oid] + [line[idx] for idx, _ in columns])
+
+    # Currently a no-op: none of the columns above is named 'parent_place_id'.
+    _rewrite_placeid_field('parent_place_id', 'parent_place_id', converted, place_ids)
+
+    check_table_content(db_conn, 'location_property_osmline', converted, grid=node_grid)
+
+
+@then(step_parse(r'W(?P<oid>\d+) expands to no interpolation'),
+      converters={'oid': int})
+def then_check_interpolation_table_negative(db_conn, oid):  # passes when the count is 0
+    with db_conn.cursor() as cur:
+        cur.execute("""SELECT count(*) FROM location_property_osmline
+                       WHERE osm_id = %s and startnumber is not null""",
+                    [oid])
+        assert cur.fetchone()[0] == 0
+
+
+scenarios('features/db')
diff --git a/test/bdd/test_osm2pgsql.py b/test/bdd/test_osm2pgsql.py
new file mode 100644
index 00000000..a2214b08
--- /dev/null
+++ b/test/bdd/test_osm2pgsql.py
@@ -0,0 +1,109 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Collector for BDD osm2pgsql import style tests.
+"""
+import asyncio
+import random
+
+import pytest
+from pytest_bdd import scenarios, when, then, given
+from pytest_bdd.parsers import re as step_parse
+
+from nominatim_db import cli
+from nominatim_db.tools.exec_utils import run_osm2pgsql
+from nominatim_db.tools.database_import import load_data, create_table_triggers
+from nominatim_db.tools.replication import run_osm2pgsql_updates
+
+from utils.checks import check_table_content
+
+
+@pytest.fixture
+def osm2pgsql_options(def_config):
+    """ Baseline options for the osm2pgsql runs of the tests. """
+    return {'osm2pgsql': 'osm2pgsql',
+            'osm2pgsql_cache': 50,
+            'osm2pgsql_style': str(def_config.get_import_style_file()),
+            'osm2pgsql_style_path': def_config.lib_dir.lua,
+            'threads': 1,
+            'dsn': def_config.get_libpq_dsn(),
+            'flatnode_file': '',
+            'tablespaces': {'slim_data': '', 'slim_index': '', 'main_data': '', 'main_index': ''},
+            'append': False}
+
+
+@pytest.fixture
+def opl_writer(tmp_path, node_grid):
+    """ Return a writer for OPL files. Nodes without ' x' get grid/random coordinates. """
+    written = 0
+
+    def _write(data):
+        nonlocal written
+        target = tmp_path / f"test_osm_{written}.opl"
+        written += 1
+        with target.open('wt') as fd:
+            for line in data.split('\n'):
+                if line.startswith('n') and ' x' not in line:
+                    pos = node_grid.get(line[1:].split(' ')[0]) \
+                          or (random.uniform(-180, 180), random.uniform(-90, 90))
+                    line = f"{line} x{pos[0]:.7f} y{pos[1]:.7f}"
+                fd.write(line + '\n')
+        return target
+    return _write
+
+
+@given('the lua style file', target_fixture='osm2pgsql_options')
+def set_lua_style_file(osm2pgsql_options, docstring, tmp_path):
+    """ Save the step's text as custom.lua and use it as the import style. """
+    lua_file = tmp_path / 'custom.lua'
+    lua_file.write_text(docstring)
+    osm2pgsql_options['osm2pgsql_style'] = str(lua_file)
+    return osm2pgsql_options
+
+
+@when('loading osm data')
+def load_from_osm_file(db, osm2pgsql_options, opl_writer, docstring):
+    """ Load the given data into a freshly created test database using osm2pgsql.
+        No further indexing is done.
+        The data is expected as attached text in OPL format. Each '//' in the
+        text is replaced with '/' before it is written to the import file.
+    """
+    osm2pgsql_options['import_file'] = opl_writer(docstring.replace(r'//', r'/'))
+    osm2pgsql_options['append'] = False
+    run_osm2pgsql(osm2pgsql_options)
+
+
+@when('updating osm data')
+def update_from_osm_file(db_conn, def_config, osm2pgsql_options, opl_writer, docstring):
+    """ Update a database previously populated with 'loading osm data'.
+        Needs to run indexing on the existing data first to yield the correct
+        result, so triggers, data load, index and function refresh run first.
+
+        The data is expected as attached text in OPL format ('//' becomes '/').
+    """
+    create_table_triggers(db_conn, def_config)
+    asyncio.run(load_data(def_config.get_libpq_dsn(), 1))
+    cli.nominatim(['index'], def_config.environ)
+    cli.nominatim(['refresh', '--functions'], def_config.environ)
+
+    osm2pgsql_options['import_file'] = opl_writer(docstring.replace(r'//', r'/'))
+    run_osm2pgsql_updates(db_conn, osm2pgsql_options)
+
+
+@when('indexing')
+def do_index(def_config):
+    """ Run Nominatim's indexing step ('nominatim index') with the default config.
+    """
+    cli.nominatim(['index'], def_config.environ)
+
+
+@then(step_parse(r'(?P<table>\w+) contains(?P<exact> exactly)?'))
+def check_place_content(db_conn, datatable, node_grid, table, exact):  # exact: optional match
+    check_table_content(db_conn, table, datatable, grid=node_grid, exact=bool(exact))
+
+
+scenarios('features/osm2pgsql')
diff --git a/test/bdd/utils/__init__.py b/test/bdd/utils/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/test/bdd/utils/api_result.py b/test/bdd/utils/api_result.py
new file mode 100644
index 00000000..d21697e2
--- /dev/null
+++ b/test/bdd/utils/api_result.py
@@ -0,0 +1,133 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Wrapper for results from the API
+"""
+import json
+import xml.etree.ElementTree as ET
+
+
+class APIResult:
+    """ Parsed API response: metadata goes into 'meta', the payload into 'result'. """
+    def __init__(self, fmt, endpoint, body):
+        getattr(self, '_parse_' + fmt)(endpoint, body)
+
+    def is_simple(self):
+        return not isinstance(self.result, list)
+
+    def __len__(self):
+        return 1 if self.is_simple() else len(self.result)
+
+    def __str__(self):
+        return json.dumps({'meta': self.meta, 'result': self.result}, indent=2)
+
+    def _parse_json(self, _, body):
+        self.meta = {}
+        self.result = json.loads(body)
+
+    def _parse_xml(self, endpoint, body):
+        xml_tree = ET.fromstring(body)
+
+        self.meta = dict(xml_tree.attrib)
+
+        if xml_tree.tag == 'reversegeocode':
+            self._parse_xml_simple(xml_tree)
+        elif xml_tree.tag == 'searchresults':
+            self._parse_xml_multi(xml_tree)
+        elif xml_tree.tag == 'error':
+            self.result = {'error': {sub.tag: sub.text for sub in xml_tree}}
+
+    def _parse_xml_simple(self, xml):
+        self.result = {}
+        for child in xml:
+            if child.tag == 'result':
+                assert not self.result, "More than one result in reverse result"
+                self.result.update(child.attrib)
+                assert 'display_name' not in self.result
+                self.result['display_name'] = child.text
+            elif child.tag == 'addressparts':
+                assert 'address' not in self.result
+                self.result['address'] = {sub.tag: sub.text for sub in child}
+            elif child.tag == 'extratags':
+                assert 'extratags' not in self.result
+                self.result['extratags'] = {tag.attrib['key']: tag.attrib['value'] for tag in child}
+            elif child.tag == 'namedetails':
+                assert 'namedetails' not in self.result
+                self.result['namedetails'] = {tag.attrib['desc']: tag.text for tag in child}
+            elif child.tag == 'geokml':
+                assert 'geokml' not in self.result
+                self.result['geokml'] = ET.tostring(child, encoding='unicode')
+            elif child.tag == 'error':
+                assert not self.result
+                self.result['error'] = child.text
+            else:
+                assert False, \
+                    f"Unknown XML tag {child.tag} on page: {ET.tostring(xml, encoding='unicode')}"
+
+    def _parse_xml_multi(self, xml):
+        self.result = []
+
+        for child in xml:
+            assert child.tag == "place"
+            res = dict(child.attrib)
+
+            address = {}
+            for sub in child:
+                if sub.tag == 'extratags':
+                    assert 'extratags' not in res
+                    res['extratags'] = {tag.attrib['key']: tag.attrib['value'] for tag in sub}
+                elif sub.tag == 'namedetails':
+                    assert 'namedetails' not in res
+                    res['namedetails'] = {tag.attrib['desc']: tag.text for tag in sub}
+                elif sub.tag == 'geokml':
+                    res['geokml'] = ET.tostring(sub, encoding='unicode')  # str, not bytes
+                else:
+                    address[sub.tag] = sub.text
+
+            if address:
+                res['address'] = address
+
+            self.result.append(res)
+
+    def _parse_geojson(self, _, body):
+        geojson = json.loads(body)
+
+        assert geojson.get('type') == 'FeatureCollection'
+        assert isinstance(geojson.get('features'), list)
+
+        self.meta = {k: v for k, v in geojson.items() if k not in ('type', 'features')}
+        self.result = []
+
+        for obj in geojson['features']:
+            assert isinstance(obj, dict)
+            assert obj.get('type') == 'Feature'
+
+            assert isinstance(obj.get('properties'), dict)
+            result = obj['properties']
+            assert 'geojson' not in result
+            result['geojson'] = obj['geometry']
+            if 'bbox' in obj:
+                assert 'boundingbox' not in result
+                # bbox is  minlon, minlat, maxlon, maxlat
+                # boundingbox is minlat, maxlat, minlon, maxlon
+                result['boundingbox'] = [obj['bbox'][1], obj['bbox'][3],
+                                         obj['bbox'][0], obj['bbox'][2]]
+            self.result.append(result)
+
+    def _parse_geocodejson(self, endpoint, body):
+        self._parse_geojson(endpoint, body)
+
+        assert set(self.meta.keys()) == {'geocoding'}
+        assert isinstance(self.meta['geocoding'], dict)
+        self.meta = self.meta['geocoding']
+
+        for r in self.result:
+            assert set(r.keys()) == {'geocoding', 'geojson'}
+            inner = r.pop('geocoding')
+            assert isinstance(inner, dict)
+            assert 'geojson' not in inner
+            r.update(inner)
diff --git a/test/bdd/utils/api_runner.py b/test/bdd/utils/api_runner.py
new file mode 100644
index 00000000..d57067b3
--- /dev/null
+++ b/test/bdd/utils/api_runner.py
@@ -0,0 +1,70 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Various helper classes for running Nominatim commands.
+"""
+import asyncio
+from collections import namedtuple
+
+APIResponse = namedtuple('APIResponse', ['endpoint', 'status', 'body', 'headers'])
+
+
+class APIRunner:
+    """ Execute a call to an API endpoint.
+    """
+    def __init__(self, environ, api_engine):
+        create_func = getattr(self, f"create_engine_{api_engine}")
+        self.exec_engine = create_func(environ)
+
+    def run(self, endpoint, params, http_headers):
+        return asyncio.run(self.exec_engine(endpoint, params, http_headers))
+
+    def run_step(self, endpoint, base_params, datatable, fmt, http_headers):  # mutates base_params
+        if fmt:
+            base_params['format'] = fmt.strip()
+
+        if datatable:
+            if datatable[0] == ['param', 'value']:
+                base_params.update(datatable[1:])
+            else:
+                base_params.update(zip(datatable[0], datatable[1]))
+
+        return self.run(endpoint, base_params, http_headers)
+
+    def create_engine_falcon(self, environ):
+        import nominatim_api.server.falcon.server
+        import falcon.testing
+
+        async def exec_engine_falcon(endpoint, params, http_headers):
+            app = nominatim_api.server.falcon.server.get_application(None, environ)
+
+            async with falcon.testing.ASGIConductor(app) as conductor:
+                response = await conductor.get("/" + endpoint, params=params,
+                                               headers=http_headers)
+
+            return APIResponse(endpoint, response.status_code, response.text, response.headers)
+
+        return exec_engine_falcon
+
+    def create_engine_starlette(self, environ):
+        import nominatim_api.server.starlette.server
+        from asgi_lifespan import LifespanManager
+        import httpx
+
+        async def _request(endpoint, params, http_headers):
+            app = nominatim_api.server.starlette.server.get_application(None, environ)
+            # AsyncClient(app=...) is gone in newer httpx; pass the app via a transport.
+            transport = httpx.ASGITransport(app=app)
+            async with LifespanManager(app):
+                async with httpx.AsyncClient(transport=transport,
+                                             base_url="http://nominatim.test") as client:
+                    response = await client.get("/" + endpoint, params=params,
+                                                headers=http_headers)
+
+            return APIResponse(endpoint, response.status_code, response.text, response.headers)
+
+        return _request
diff --git a/test/bdd/utils/checks.py b/test/bdd/utils/checks.py
new file mode 100644
index 00000000..592dad69
--- /dev/null
+++ b/test/bdd/utils/checks.py
@@ -0,0 +1,237 @@
+# SPDX-License-Identifier: GPL-2.0-only
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Helper functions to compare expected values.
+"""
+import json
+import re
+import math
+
+from psycopg import sql as pysql
+from psycopg.rows import dict_row
+from .geometry_alias import ALIASES
+
+
+# Named comparison predicates. Each one is called with (exp, act) and
+# relates act to exp.
+COMPARATOR_TERMS = {'exactly': lambda exp, act: exp == act,
+                    'more than': lambda exp, act: act > exp,
+                    'less than': lambda exp, act: act < exp}
+
+
+def _pretty(obj):  # render obj as indented JSON with sorted keys
+    return json.dumps(obj, indent=2, sort_keys=True)
+
+
+def _pt_close(p1, p2):
+    """ Check that the first two items of p1 and p2 are close (abs_tol=1e-07). """
+    return all(math.isclose(p1[axis], p2[axis], abs_tol=1e-07) for axis in (0, 1))
+
+
+def within_box(value, expect):
+    """ Check a point or bbox against the comma-separated box in `expect`.
+        `value` is a sequence of numbers, a comma-separated string or
+        a 'POINT(x y)' string.
+    """
+    box = list(map(float, expect.split(',')))
+
+    if isinstance(value, str):
+        value = value[6:-1].split(' ') if value.startswith('POINT') else value.split(',')
+    nums = [float(item) for item in value]
+
+    if len(nums) == 2:
+        # point: box items 0 and 2 bound the first, items 1 and 3 the second coordinate
+        return box[0] <= nums[0] <= box[2] and box[1] <= nums[1] <= box[3]
+    if len(nums) == 4:
+        # bbox: even items must not be below, odd items not above their box counterpart
+        return all(nums[i] <= box[i] if i % 2 else nums[i] >= box[i] for i in range(4))
+
+    raise ValueError("Not a coordinate or bbox.")
+
+
+COMPARISON_FUNCS = {  # formatter suffix -> predicate(actual value, expected string)
+    None: lambda val, exp: str(val) == exp,
+    'i': lambda val, exp: str(val).lower() == exp.lower(),
+    'fm': lambda val, exp: re.fullmatch(exp, str(val)) is not None,  # also for non-strings
+    # NOTE(review): eval() runs the expected text as Python; only use with trusted test data.
+    'dict': lambda val, exp: val is None if exp == '-' else (val == eval('{' + exp + '}')),
+    'in_box': within_box}
+
+# Lower-case type letter for every accepted spelling of an OSM object type.
+OSM_TYPE = dict(node='n', way='w', relation='r', N='n', W='w', R='r')
+
+
+class ResultAttr:
+    """ Returns the given attribute as a string.
+
+        The key parameter determines how the value is formatted before
+        returning. To refer to sub attributes, use '+' to add more keys
+        (e.g. 'name+ref' will access obj['name']['ref']). A '!' introduces
+        a formatting suffix. If no suffix is given, the value will be
+        converted using the str() function.
+
+        Available formatters:
+        !:...   - use a formatting expression according to Python Mini Format Spec
+        !i      - make case-insensitive comparison
+        !fm     - consider comparison string a regular expression and match full value
+        !dict   - the expected value is the content of a dict literal, '-' stands for None
+        !wkt    - convert the expected value to a WKT string before comparing
+        !in_box - the expected value is a comma-separated bbox description
+    """
+
+    def __init__(self, obj, key, grid=None):
+        """ Look up `key` in `obj`; `grid` resolves grid points in '!wkt' comparisons. """
+        self.grid = grid
+        self.obj = obj
+        if '!' in key:
+            self.key, self.fmt = key.rsplit('!', 1)
+        else:
+            self.key = key
+            self.fmt = None
+        if self.key == 'object':
+            assert 'osm_id' in obj
+            assert 'osm_type' in obj
+            self.subobj = OSM_TYPE[obj['osm_type']] + str(obj['osm_id'])
+            self.fmt = 'i'  # object ids compare case-insensitively
+        else:
+            done = ''
+            self.subobj = self.obj
+            for sub in self.key.split('+'):
+                done += f"[{sub}]"
+                assert sub in self.subobj, \
+                    f"Missing attribute {done}. Full object:\n{_pretty(self.obj)}"
+                self.subobj = self.subobj[sub]
+
+    def __eq__(self, other):
+        """ Compare the attribute with an expected value using the formatter of the key. """
+        if not isinstance(other, str):
+            return self.subobj == other
+        # work around bad quoting by pytest-bdd
+        other = other.replace(r'\\', '\\')
+
+        if self.fmt in COMPARISON_FUNCS:
+            return COMPARISON_FUNCS[self.fmt](self.subobj, other)
+
+        if self.fmt.startswith(':'):
+            return other == f"{{{self.fmt}}}".format(self.subobj)
+
+        if self.fmt == 'wkt':
+            return self.compare_wkt(self.subobj, other)
+
+        raise RuntimeError(f"Unknown format string '{self.fmt}'.")
+
+    def __repr__(self):
+        k = self.key.replace('+', '][')
+        if self.fmt:
+            k += '!' + self.fmt
+        return f"result[{k}]({self.subobj})"
+
+    def compare_wkt(self, value, expected):
+        """ Compare a WKT value against a compact geometry format.
+            The function understands the following formats:
+
+              country:<country code>
+                 Point geometry guaranteed to be in the given country
+              <P>
+                 Point geometry
+              <P>,...,<P>
+                 Line geometry
+              (<P>,...,<P>)
+                 Polygon geometry
+
+           <P> may either be a coordinate of the form '<x> <y>' or a single
+           number. In the latter case it must refer to a point in
+           a previously defined grid.
+        """
+        m = re.fullmatch(r'(POINT)\(([0-9. -]*)\)', value) \
+            or re.fullmatch(r'(LINESTRING)\(([0-9,. -]*)\)', value) \
+            or re.fullmatch(r'(POLYGON)\(\(([0-9,. -]*)\)\)', value)
+        if not m:
+            return False
+
+        converted = [list(map(float, pt.split(' ', 1))) for pt in map(str.strip, m[2].split(','))]
+
+        if expected.startswith('country:'):
+            ccode = expected[8:].upper()
+            assert ccode in ALIASES, f"Geometry error: unknown country {ccode}"
+            return m[1] == 'POINT' and _pt_close(converted[0], ALIASES[ccode])
+
+        if ',' not in expected:
+            return m[1] == 'POINT' and _pt_close(converted[0], self.get_point(expected))
+
+        if '(' not in expected:
+            if m[1] != 'LINESTRING':
+                return False
+            exp_line = [self.get_point(p) for p in expected.split(',')]  # lengths must match
+            return len(converted) == len(exp_line) and all(map(_pt_close, converted, exp_line))
+
+        if m[1] != 'POLYGON':
+            return False
+
+        # Polygon comparison is tricky because the polygons don't necessarily
+        # end at the same point or have the same winding order.
+        # Brute force all possible variants of the expected polygon
+        exp_coords = [self.get_point(p) for p in expected[1:-1].split(',')]
+        if exp_coords[0] != exp_coords[-1]:
+            raise RuntimeError(f"Invalid polygon {expected}. "
+                               "First and last point need to be the same")
+        if len(converted) != len(exp_coords):  # zip() below would hide extra points
+            return False
+        for line in (exp_coords[:-1], exp_coords[-1:0:-1]):
+            for i in range(len(line)):
+                if all(_pt_close(p1, p2) for p1, p2 in zip(converted, line[i:] + line[:i])):
+                    return True
+        return False
+
+    def get_point(self, pt):
+        """ Turn '<x> <y>' into [x, y]; any other value is looked up in the grid.
+        """
+        pt = pt.strip()
+        if ' ' in pt:
+            return list(map(float, pt.split(' ', 1)))
+        assert self.grid, f"Grid point '{pt}' used but no grid is defined"
+        return self.grid.get(pt)
+
+
+def check_table_content(conn, tablename, data, grid=None, exact=False):
+    """ Check that every row of data (data[0] holds the column headings)
+        matches a row of its own in the given table. When exact is set,
+        the table must not contain rows that match none of the data rows.
+    """
+    headings = data[0]
+    pending = set(range(1, len(data)))
+
+    selects = []
+    for heading in headings:
+        name, marker, fmt = heading.rpartition('!')
+        if heading == 'object':
+            selects += ['osm_id', 'osm_type']
+        elif marker and fmt in ('wkt', 'in_box'):
+            selects.append(f"ST_AsText({name}) as {name}")
+        else:
+            # only the top-level column is selected, sub-keys are resolved later
+            selects.append((name if marker else heading).split('+')[0])
+
+    with conn.cursor(row_factory=dict_row) as cur:
+        cur.execute(pysql.SQL(f"SELECT {','.join(selects)} FROM")
+                    + pysql.Identifier(tablename))
+
+        table_content = ''
+        for row in cur:
+            table_content += '\n' + str(row)
+            # first still unmatched data row whose columns all agree with this table row
+            found = next((i for i in pending
+                          if all(ResultAttr(row, col, grid=grid) == (None if val == '-' else val)
+                                 for col, val in zip(headings, data[i]))), None)
+            if found is None:
+                assert not exact, f"Unexpected row in table {tablename}: {row}"
+            else:
+                pending.remove(found)
+
+        not_found = '\n'.join(str(data[i]) for i in pending)
+        assert not pending, \
+               f"Rows not found:\n{not_found}\nTable content:\n{table_content}"
diff --git a/test/bdd/utils/db.py b/test/bdd/utils/db.py
new file mode 100644
index 00000000..805b55b2
--- /dev/null
+++ b/test/bdd/utils/db.py
@@ -0,0 +1,102 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Helper functions for managing test databases.
+"""
+import asyncio
+import psycopg
+from psycopg import sql as pysql
+
+from nominatim_db.tools.database_import import setup_database_skeleton, create_tables, \
+                                               create_partition_tables, create_search_indices
+from nominatim_db.data.country_info import setup_country_tables, create_country_names
+from nominatim_db.tools.refresh import create_functions, load_address_levels_from_config
+from nominatim_db.tools.exec_utils import run_osm2pgsql
+from nominatim_db.tokenizer import factory as tokenizer_factory
+
+
+class DBManager:
+    """ Creates, checks and drops databases through the 'postgres' database. """
+
+    def __init__(self, purge=False):
+        self.purge = purge
+
+    def check_for_db(self, dbname):
+        """ Report if the database exists already. With the purge option
+            set, the database is dropped first and reported as missing.
+        """
+        if not self.purge:
+            return self.exists_db(dbname)
+        self.drop_db(dbname)
+        return False
+
+    def drop_db(self, dbname):
+        """ Remove the database of the given name, if there is one.
+        """
+        statement = pysql.SQL('DROP DATABASE IF EXISTS') + pysql.Identifier(dbname)
+        with psycopg.connect(dbname='postgres') as conn:
+            conn.autocommit = True
+            conn.execute(statement)
+
+    def exists_db(self, dbname):
+        """ Return True when exactly one database of the given name is
+            listed in pg_database.
+        """
+        query = 'select count(*) from pg_database where datname = %s'
+        with psycopg.connect(dbname='postgres') as conn:
+            return conn.execute(query, (dbname,)).fetchone()[0] == 1
+
+    def create_db_from_template(self, dbname, template):
+        """ Make a fresh copy of the template database under the given name,
+            dropping any database that already uses that name.
+        """
+        db_name, tmpl_name = pysql.Identifier(dbname), pysql.Identifier(template)
+        with psycopg.connect(dbname='postgres') as conn:
+            conn.autocommit = True
+            for statement in (pysql.SQL('DROP DATABASE IF EXISTS') + db_name,
+                              pysql.SQL('CREATE DATABASE {} WITH TEMPLATE {}')
+                                   .format(db_name, tmpl_name)):
+                conn.execute(statement)
+
+    def setup_template_db(self, config):
+        """ Create a template DB which contains the necessary extensions
+            and basic static tables.
+
+            Nothing is done when the database exists already, unless 'purge'
+            is set, in which case it is dropped and built again.
+        """
+        dsn = config.get_libpq_dsn()
+
+        if self.check_for_db(config.get_database_params()['dbname']):
+            return
+
+        setup_database_skeleton(dsn)
+
+        # Run osm2pgsql on an empty OSM document.
+        osm2pgsql_options = {
+            'osm2pgsql': 'osm2pgsql',
+            'osm2pgsql_cache': 1,
+            'osm2pgsql_style': str(config.get_import_style_file()),
+            'osm2pgsql_style_path': config.lib_dir.lua,
+            'threads': 1,
+            'dsn': dsn,
+            'flatnode_file': '',
+            'tablespaces': {'slim_data': '', 'slim_index': '',
+                            'main_data': '', 'main_index': ''},
+            'append': False,
+            'import_data': b'<osm version="0.6"></osm>',
+        }
+        run_osm2pgsql(osm2pgsql_options)
+        setup_country_tables(dsn, config.lib_dir.data)
+
+        with psycopg.connect(dsn) as conn:
+            create_tables(conn, config)
+            load_address_levels_from_config(conn, config)
+            create_partition_tables(conn, config)
+            create_functions(conn, config, enable_diff_updates=False)
+            asyncio.run(create_search_indices(conn, config))
+            create_country_names(conn, tokenizer_factory.create_tokenizer(config))
diff --git a/test/bdd/utils/geometry_alias.py b/test/bdd/utils/geometry_alias.py
new file mode 100644
index 00000000..dbec5201
--- /dev/null
+++ b/test/bdd/utils/geometry_alias.py
@@ -0,0 +1,262 @@
+# SPDX-License-Identifier: GPL-2.0-only
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Collection of aliases for various world coordinates.
+"""
+
+ALIASES = {
+    # Country aliases: upper-case country code -> (x, y) of a point inside that country
+    'AD': (1.58972, 42.54241),
+    'AE': (54.61589, 24.82431),
+    'AF': (65.90264, 34.84708),
+    'AG': (-61.72430, 17.069),
+    'AI': (-63.10571, 18.25461),
+    'AL': (19.84941, 40.21232),
+    'AM': (44.64229, 40.37821),
+    'AO': (16.21924, -12.77014),
+    'AQ': (44.99999, -75.65695),
+    'AR': (-61.10759, -34.37615),
+    'AS': (-170.68470, -14.29307),
+    'AT': (14.25747, 47.36542),
+    'AU': (138.23155, -23.72068),
+    'AW': (-69.98255, 12.555),
+    'AX': (19.91839, 59.81682),
+    'AZ': (48.38555, 40.61639),
+    'BA': (17.18514, 44.25582),
+    'BB': (-59.53342, 13.19),
+    'BD': (89.75989, 24.34205),
+    'BE': (4.90078, 50.34682),
+    'BF': (-0.56743, 11.90471),
+    'BG': (24.80616, 43.09859),
+    'BH': (50.52032, 25.94685),
+    'BI': (29.54561, -2.99057),
+    'BJ': (2.70062, 10.02792),
+    'BL': (-62.79349, 17.907),
+    'BM': (-64.77406, 32.30199),
+    'BN': (114.52196, 4.28638),
+    'BO': (-62.02473, -17.77723),
+    'BQ': (-63.14322, 17.566),
+    'BR': (-45.77065, -9.58685),
+    'BS': (-77.60916, 23.8745),
+    'BT': (90.01350, 27.28137),
+    'BV': (3.35744, -54.4215),
+    'BW': (23.51505, -23.48391),
+    'BY': (26.77259, 53.15885),
+    'BZ': (-88.63489, 16.33951),
+    'CA': (-107.74817, 67.12612),
+    'CC': (96.84420, -12.01734),
+    'CD': (24.09544, -1.67713),
+    'CF': (22.58701, 5.98438),
+    'CG': (15.78875, 0.40388),
+    'CH': (7.65705, 46.57446),
+    'CI': (-6.31190, 6.62783),
+    'CK': (-159.77835, -21.23349),
+    'CL': (-70.41790, -53.77189),
+    'CM': (13.26022, 5.94519),
+    'CN': (96.44285, 38.04260),
+    'CO': (-72.52951, 2.45174),
+    'CR': (-83.83314, 9.93514),
+    'CU': (-80.81673, 21.88852),
+    'CV': (-24.50810, 14.929),
+    'CW': (-68.96409, 12.1845),
+    'CX': (105.62411, -10.48417),
+    'CY': (32.95922, 35.37010),
+    'CZ': (16.32098, 49.50692),
+    'DE': (9.30716, 50.21289),
+    'DJ': (42.96904, 11.41542),
+    'DK': (9.18490, 55.98916),
+    'DM': (-61.00358, 15.65470),
+    'DO': (-69.62855, 18.58841),
+    'DZ': (4.24749, 25.79721),
+    'EC': (-77.45831, -0.98284),
+    'EE': (23.94288, 58.43952),
+    'EG': (28.95293, 28.17718),
+    'EH': (-13.69031, 25.01241),
+    'ER': (39.01223, 14.96033),
+    'ES': (-2.59110, 38.79354),
+    'ET': (38.61697, 7.71399),
+    'FI': (26.89798, 63.56194),
+    'FJ': (177.91853, -17.74237),
+    'FK': (-58.99044, -51.34509),
+    'FM': (151.95358, 8.5045),
+    'FO': (-6.60483, 62.10000),
+    'FR': (0.28410, 47.51045),
+    'GA': (10.81070, -0.07429),
+    'GB': (-0.92823, 52.01618),
+    'GD': (-61.64524, 12.191),
+    'GE': (44.16664, 42.00385),
+    'GF': (-53.46524, 3.56188),
+    'GG': (-2.50580, 49.58543),
+    'GH': (-0.46348, 7.16051),
+    'GI': (-5.32053, 36.11066),
+    'GL': (-33.85511, 74.66355),
+    'GM': (-16.40960, 13.25),
+    'GN': (-13.83940, 10.96291),
+    'GP': (-61.68712, 16.23049),
+    'GQ': (10.23973, 1.43119),
+    'GR': (23.17850, 39.06206),
+    'GS': (-36.49430, -54.43067),
+    'GT': (-90.74368, 15.20428),
+    'GU': (144.73362, 13.44413),
+    'GW': (-14.83525, 11.92486),
+    'GY': (-58.45167, 5.73698),
+    'HK': (114.18577, 22.34923),
+    'HM': (73.68230, -53.22105),
+    'HN': (-86.95414, 15.23820),
+    'HR': (17.49966, 45.52689),
+    'HT': (-73.51925, 18.32492),
+    'HU': (20.35362, 47.51721),
+    'ID': (123.34505, -0.83791),
+    'IE': (-9.00520, 52.87725),
+    'IL': (35.46314, 32.86165),
+    'IM': (-4.86740, 54.023),
+    'IN': (88.67620, 27.86155),
+    'IO': (71.42743, -6.14349),
+    'IQ': (42.58109, 34.26103),
+    'IR': (56.09355, 30.46751),
+    'IS': (-17.51785, 64.71687),
+    'IT': (10.42639, 44.87904),
+    'JE': (-2.19261, 49.12458),
+    'JM': (-76.84020, 18.3935),
+    'JO': (36.55552, 30.75741),
+    'JP': (138.72531, 35.92099),
+    'KE': (36.90602, 1.08512),
+    'KG': (76.15571, 41.66497),
+    'KH': (104.31901, 12.95555),
+    'KI': (173.63353, 0.139),
+    'KM': (44.31474, -12.241),
+    'KN': (-62.69379, 17.2555),
+    'KP': (126.65575, 39.64575),
+    'KR': (127.27740, 36.41388),
+    'KW': (47.30684, 29.69180),
+    'KY': (-81.07455, 19.29949),
+    'KZ': (72.00811, 49.88855),
+    'LA': (102.44391, 19.81609),
+    'LB': (35.48464, 33.41766),
+    'LC': (-60.97894, 13.891),
+    'LI': (9.54693, 47.15934),
+    'LK': (80.38520, 8.41649),
+    'LR': (-11.16960, 4.04122),
+    'LS': (28.66984, -29.94538),
+    'LT': (24.51735, 55.49293),
+    'LU': (6.08649, 49.81533),
+    'LV': (23.51033, 56.67144),
+    'LY': (15.36841, 28.12177),
+    'MA': (-4.03061, 33.21696),
+    'MC': (7.47743, 43.62917),
+    'MD': (29.61725, 46.66517),
+    'ME': (19.72291, 43.02441),
+    'MF': (-63.06666, 18.08102),
+    'MG': (45.86378, -20.50245),
+    'MH': (171.94982, 5.983),
+    'MK': (21.42108, 41.08980),
+    'ML': (-1.93310, 16.46993),
+    'MM': (95.54624, 21.09620),
+    'MN': (99.81138, 48.18615),
+    'MO': (113.56441, 22.16209),
+    'MP': (145.21345, 14.14902),
+    'MQ': (-60.81128, 14.43706),
+    'MR': (-9.42324, 22.59251),
+    'MS': (-62.19455, 16.745),
+    'MT': (14.38363, 35.94467),
+    'MU': (57.55121, -20.41),
+    'MV': (73.39292, 4.19375),
+    'MW': (33.95722, -12.28218),
+    'MX': (-105.89221, 25.86826),
+    'MY': (112.71154, 2.10098),
+    'MZ': (37.58689, -13.72682),
+    'NA': (16.68569, -21.46572),
+    'NC': (164.95322, -20.38889),
+    'NE': (10.06041, 19.08273),
+    'NF': (167.95718, -29.0645),
+    'NG': (10.17781, 10.17804),
+    'NI': (-85.87974, 13.21715),
+    'NL': (-68.57062, 12.041),
+    'NO': (23.11556, 70.09934),
+    'NP': (83.36259, 28.13107),
+    'NR': (166.93479, -0.5275),
+    'NU': (-169.84873, -19.05305),
+    'NZ': (167.97209, -45.13056),
+    'OM': (56.86055, 20.47413),
+    'PA': (-79.40160, 8.80656),
+    'PE': (-78.66540, -7.54711),
+    'PF': (-145.05719, -16.70862),
+    'PG': (146.64600, -7.37427),
+    'PH': (121.48359, 15.09965),
+    'PK': (72.11347, 31.14629),
+    'PL': (17.88136, 52.77182),
+    'PM': (-56.19515, 46.78324),
+    'PN': (-130.10642, -25.06955),
+    'PR': (-65.88755, 18.37169),
+    'PS': (35.39801, 32.24773),
+    'PT': (-8.45743, 40.11154),
+    'PW': (134.49645, 7.3245),
+    'PY': (-59.51787, -22.41281),
+    'QA': (51.49903, 24.99816),
+    'RE': (55.77345, -21.36388),
+    'RO': (26.37632, 45.36120),
+    'RS': (20.40371, 44.56413),
+    'RU': (116.44060, 59.06780),
+    'RW': (29.57882, -1.62404),
+    'SA': (47.73169, 22.43790),
+    'SB': (164.63894, -10.23606),
+    'SC': (46.36566, -9.454),
+    'SD': (28.14720, 14.56423),
+    'SE': (15.68667, 60.35568),
+    'SG': (103.84187, 1.304),
+    'SH': (-12.28155, -37.11546),
+    'SI': (14.04738, 46.39085),
+    'SJ': (15.27552, 79.23365),
+    'SK': (20.41603, 48.86970),
+    'SL': (-11.47773, 8.78156),
+    'SM': (12.46062, 43.94279),
+    'SN': (-15.37111, 14.99477),
+    'SO': (46.93383, 9.34094),
+    'SR': (-55.42864, 4.56985),
+    'SS': (28.13573, 8.50933),
+    'ST': (6.61025, 0.2215),
+    'SV': (-89.36665, 13.43072),
+    'SX': (-63.15393, 17.9345),
+    'SY': (38.15513, 35.34221),
+    'SZ': (31.78263, -26.14244),
+    'TC': (-71.32554, 21.35),
+    'TD': (17.42092, 13.46223),
+    'TF': (137.5, -67.5),
+    'TG': (1.06983, 7.87677),
+    'TH': (102.00877, 16.42310),
+    'TJ': (71.91349, 39.01527),
+    'TK': (-171.82603, -9.20990),
+    'TL': (126.22520, -8.72636),
+    'TM': (57.71603, 39.92534),
+    'TN': (9.04958, 34.84199),
+    'TO': (-176.99320, -23.11104),
+    'TR': (32.82002, 39.86350),
+    'TT': (-60.70793, 11.1385),
+    'TV': (178.77499, -9.41685),
+    'TW': (120.30074, 23.17002),
+    'TZ': (33.53892, -5.01840),
+    'UA': (33.44335, 49.30619),
+    'UG': (32.96523, 2.08584),
+    'UM': (-169.50993, 16.74605),
+    'US': (-116.39535, 40.71379),
+    'UY': (-56.46505, -33.62658),
+    'UZ': (61.35529, 42.96107),
+    'VA': (12.33197, 42.04931),
+    'VC': (-61.09905, 13.316),
+    'VE': (-64.88323, 7.69849),
+    'VG': (-64.62479, 18.419),
+    'VI': (-64.88950, 18.32263),
+    'VN': (104.20179, 10.27644),
+    'VU': (167.31919, -15.88687),
+    'WF': (-176.20781, -13.28535),
+    'WS': (-172.10966, -13.85093),
+    'YE': (45.94562, 16.16338),
+    'YT': (44.93774, -12.60882),
+    'ZA': (23.19488, -30.43276),
+    'ZM': (26.38618, -14.39966),
+    'ZW': (30.12419, -19.86907)
+    }
diff --git a/test/bdd/utils/grid.py b/test/bdd/utils/grid.py
new file mode 100644
index 00000000..50355a1b
--- /dev/null
+++ b/test/bdd/utils/grid.py
@@ -0,0 +1,46 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+A grid describing node placement in an area.
+Useful for visually describing geometries.
+"""
+
+
+class Grid:
+    """ Maps the ids in a table of rows and cells to coordinates: cells
+        advance x, rows advance y, each by `step`, starting at `origin`.
+    """
+    def __init__(self, table, step, origin):
+        step = 0.00001 if step is None else step
+        origin = (0.0, 0.0) if origin is None else origin
+        self.grid = {}
+
+        row_y = origin[1]
+        for cells in table:
+            cell_x = origin[0]
+            for node in cells:
+                if node:  # empty cells only take up space
+                    self.grid[node] = (cell_x, row_y)
+                cell_x += step
+            row_y += step
+
+    def get(self, nodeid):
+        """ Return the (x, y) tuple of a grid node or None for unknown ids. """
+        return self.grid.get(nodeid)
+
+    def parse_point(self, value):
+        """ Return [x, y] for a '<x> <y>' string, else the result of a
+            lookup of the stripped value in the grid.
+        """
+        point = value.strip()
+        if ' ' not in point:
+            return self.grid.get(point)
+        return list(map(float, point.split(' ', 1)))
+
+    def parse_line(self, value):
+        """ Split a comma-separated list and parse each part as a point. """
+        return list(map(self.parse_point, value.split(',')))
diff --git a/test/bdd/steps/place_inserter.py b/test/bdd/utils/place_inserter.py
similarity index 63%
rename from test/bdd/steps/place_inserter.py
rename to test/bdd/utils/place_inserter.py
index c033ac17..a330c3ac 100644
--- a/test/bdd/steps/place_inserter.py
+++ b/test/bdd/utils/place_inserter.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2022 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Helper classes for filling the place table.
@@ -10,27 +10,32 @@ Helper classes for filling the place table.
 import random
 import string
 
+from .geometry_alias import ALIASES
+
+
 class PlaceColumn:
-    """ Helper class to collect contents from a behave table row and
+    """ Helper class to collect contents from a BDD table row and
         insert it into the place table.
     """
-    def __init__(self, context):
-        self.columns = {'admin_level' : 15}
-        self.context = context
+    def __init__(self, grid=None):
+        self.columns = {'admin_level': 15}
+        self.grid = grid
         self.geometry = None
 
-    def add_row(self, row, force_name):
+    def add_row(self, headings, row, force_name):
         """ Parse the content from the given behave row as place column data.
         """
-        for name, value in zip(row.headings, row.cells):
+        for name, value in zip(headings, row):
             self._add(name, value)
 
         assert 'osm_type' in self.columns, "osm column missing"
 
         if force_name and 'name' not in self.columns:
-            self._add_hstore('name', 'name',
-                             ''.join(random.choice(string.printable)
-                                     for _ in range(int(random.random()*30))))
+            self._add_hstore(
+                'name',
+                'name',
+                ''.join(random.choices(string.printable, k=random.randrange(30))),
+            )
 
         return self
 
@@ -83,8 +88,29 @@ class PlaceColumn:
             self._add_hstore('address', 'country', value)
 
     def _set_key_geometry(self, value):
-        self.geometry = self.context.osm.parse_geometry(value)
-        assert self.geometry is not None, "Bad geometry: {}".format(value)
+        if value.startswith('country:'):
+            ccode = value[8:].upper()
+            self.geometry = "ST_SetSRID(ST_Point({}, {}), 4326)".format(*ALIASES[ccode])
+        elif ',' not in value:
+            if self.grid:
+                pt = self.grid.parse_point(value)
+            else:
+                pt = value.split(' ')
+            self.geometry = f"ST_SetSRID(ST_Point({pt[0]}, {pt[1]}), 4326)"
+        elif '(' not in value:
+            if self.grid:
+                coords = ','.join(' '.join(f"{p:.7f}" for p in pt)
+                                  for pt in self.grid.parse_line(value))
+            else:
+                coords = value
+            self.geometry = f"'srid=4326;LINESTRING({coords})'::geometry"
+        else:
+            if self.grid:
+                coords = ','.join(' '.join(f"{p:.7f}" for p in pt)
+                                  for pt in self.grid.parse_line(value[1:-1]))
+            else:
+                coords = value[1:-1]
+            self.geometry = f"'srid=4326;POLYGON(({coords}))'::geometry"
 
     def _add_hstore(self, column, key, value):
         if column in self.columns:
@@ -96,17 +122,17 @@ class PlaceColumn:
         """ Issue a delete for the given OSM object.
         """
         cursor.execute('DELETE FROM place WHERE osm_type = %s and osm_id = %s',
-                       (self.columns['osm_type'] , self.columns['osm_id']))
+                       (self.columns['osm_type'], self.columns['osm_id']))
 
     def db_insert(self, cursor):
         """ Insert the collected data into the database.
         """
         if self.columns['osm_type'] == 'N' and self.geometry is None:
-            pt = self.context.osm.grid_node(self.columns['osm_id'])
+            pt = self.grid.get(str(self.columns['osm_id'])) if self.grid else None
             if pt is None:
-                pt = (random.random()*360 - 180, random.random()*180 - 90)
+                pt = (random.uniform(-180, 180), random.uniform(-90, 90))
 
-            self.geometry = "ST_SetSRID(ST_Point(%f, %f), 4326)" % pt
+            self.geometry = "ST_SetSRID(ST_Point({}, {}), 4326)".format(*pt)
         else:
             assert self.geometry is not None, "Geometry missing"
 
diff --git a/test/python/api/conftest.py b/test/python/api/conftest.py
index 3ca0720b..944e66cb 100644
--- a/test/python/api/conftest.py
+++ b/test/python/api/conftest.py
@@ -2,14 +2,13 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Helper fixtures for API call tests.
 """
 import pytest
 import pytest_asyncio
-import time
 import datetime as dt
 
 import sqlalchemy as sa
@@ -20,27 +19,25 @@ from nominatim_api.search.query_analyzer_factory import make_query_analyzer
 from nominatim_db.tools import convert_sqlite
 import nominatim_api.logging as loglib
 
+
 class APITester:
 
     def __init__(self):
         self.api = napi.NominatimAPI()
         self.async_to_sync(self.api._async_api.setup_database())
 
-
     def async_to_sync(self, func):
         """ Run an asynchronous function until completion using the
             internal loop of the API.
         """
         return self.api._loop.run_until_complete(func)
 
-
     def add_data(self, table, data):
         """ Insert data into the given table.
         """
         sql = getattr(self.api._async_api._tables, table).insert()
         self.async_to_sync(self.exec_async(sql, data))
 
-
     def add_placex(self, **kw):
         name = kw.get('name')
         if isinstance(name, str):
@@ -50,30 +47,29 @@ class APITester:
         geometry = kw.get('geometry', 'POINT(%f %f)' % centroid)
 
         self.add_data('placex',
-                     {'place_id': kw.get('place_id', 1000),
-                      'osm_type': kw.get('osm_type', 'W'),
-                      'osm_id': kw.get('osm_id', 4),
-                      'class_': kw.get('class_', 'highway'),
-                      'type': kw.get('type', 'residential'),
-                      'name': name,
-                      'address': kw.get('address'),
-                      'extratags': kw.get('extratags'),
-                      'parent_place_id': kw.get('parent_place_id'),
-                      'linked_place_id': kw.get('linked_place_id'),
-                      'admin_level': kw.get('admin_level', 15),
-                      'country_code': kw.get('country_code'),
-                      'housenumber': kw.get('housenumber'),
-                      'postcode': kw.get('postcode'),
-                      'wikipedia': kw.get('wikipedia'),
-                      'rank_search': kw.get('rank_search', 30),
-                      'rank_address': kw.get('rank_address', 30),
-                      'importance': kw.get('importance'),
-                      'centroid': 'POINT(%f %f)' % centroid,
-                      'indexed_status': kw.get('indexed_status', 0),
-                      'indexed_date': kw.get('indexed_date',
-                                             dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
-                      'geometry': geometry})
-
+                      {'place_id': kw.get('place_id', 1000),
+                       'osm_type': kw.get('osm_type', 'W'),
+                       'osm_id': kw.get('osm_id', 4),
+                       'class_': kw.get('class_', 'highway'),
+                       'type': kw.get('type', 'residential'),
+                       'name': name,
+                       'address': kw.get('address'),
+                       'extratags': kw.get('extratags'),
+                       'parent_place_id': kw.get('parent_place_id'),
+                       'linked_place_id': kw.get('linked_place_id'),
+                       'admin_level': kw.get('admin_level', 15),
+                       'country_code': kw.get('country_code'),
+                       'housenumber': kw.get('housenumber'),
+                       'postcode': kw.get('postcode'),
+                       'wikipedia': kw.get('wikipedia'),
+                       'rank_search': kw.get('rank_search', 30),
+                       'rank_address': kw.get('rank_address', 30),
+                       'importance': kw.get('importance'),
+                       'centroid': 'POINT(%f %f)' % centroid,
+                       'indexed_status': kw.get('indexed_status', 0),
+                       'indexed_date': kw.get('indexed_date',
+                                              dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
+                       'geometry': geometry})
 
     def add_address_placex(self, object_id, **kw):
         self.add_placex(**kw)
@@ -85,46 +81,42 @@ class APITester:
                        'fromarea': kw.get('fromarea', False),
                        'isaddress': kw.get('isaddress', True)})
 
-
     def add_osmline(self, **kw):
         self.add_data('osmline',
-                     {'place_id': kw.get('place_id', 10000),
-                      'osm_id': kw.get('osm_id', 4004),
-                      'parent_place_id': kw.get('parent_place_id'),
-                      'indexed_date': kw.get('indexed_date',
-                                             dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
-                      'startnumber': kw.get('startnumber', 2),
-                      'endnumber': kw.get('endnumber', 6),
-                      'step': kw.get('step', 2),
-                      'address': kw.get('address'),
-                      'postcode': kw.get('postcode'),
-                      'country_code': kw.get('country_code'),
-                      'linegeo': kw.get('geometry', 'LINESTRING(1.1 -0.2, 1.09 -0.22)')})
-
+                      {'place_id': kw.get('place_id', 10000),
+                       'osm_id': kw.get('osm_id', 4004),
+                       'parent_place_id': kw.get('parent_place_id'),
+                       'indexed_date': kw.get('indexed_date',
+                                              dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
+                       'startnumber': kw.get('startnumber', 2),
+                       'endnumber': kw.get('endnumber', 6),
+                       'step': kw.get('step', 2),
+                       'address': kw.get('address'),
+                       'postcode': kw.get('postcode'),
+                       'country_code': kw.get('country_code'),
+                       'linegeo': kw.get('geometry', 'LINESTRING(1.1 -0.2, 1.09 -0.22)')})
 
     def add_tiger(self, **kw):
         self.add_data('tiger',
-                     {'place_id': kw.get('place_id', 30000),
-                      'parent_place_id': kw.get('parent_place_id'),
-                      'startnumber': kw.get('startnumber', 2),
-                      'endnumber': kw.get('endnumber', 6),
-                      'step': kw.get('step', 2),
-                      'postcode': kw.get('postcode'),
-                      'linegeo': kw.get('geometry', 'LINESTRING(1.1 -0.2, 1.09 -0.22)')})
-
+                      {'place_id': kw.get('place_id', 30000),
+                       'parent_place_id': kw.get('parent_place_id'),
+                       'startnumber': kw.get('startnumber', 2),
+                       'endnumber': kw.get('endnumber', 6),
+                       'step': kw.get('step', 2),
+                       'postcode': kw.get('postcode'),
+                       'linegeo': kw.get('geometry', 'LINESTRING(1.1 -0.2, 1.09 -0.22)')})
 
     def add_postcode(self, **kw):
         self.add_data('postcode',
-                     {'place_id': kw.get('place_id', 1000),
-                      'parent_place_id': kw.get('parent_place_id'),
-                      'country_code': kw.get('country_code'),
-                      'postcode': kw.get('postcode'),
-                      'rank_search': kw.get('rank_search', 20),
-                      'rank_address': kw.get('rank_address', 22),
-                      'indexed_date': kw.get('indexed_date',
-                                             dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
-                      'geometry': kw.get('geometry', 'POINT(23 34)')})
-
+                      {'place_id': kw.get('place_id', 1000),
+                       'parent_place_id': kw.get('parent_place_id'),
+                       'country_code': kw.get('country_code'),
+                       'postcode': kw.get('postcode'),
+                       'rank_search': kw.get('rank_search', 20),
+                       'rank_address': kw.get('rank_address', 22),
+                       'indexed_date': kw.get('indexed_date',
+                                              dt.datetime(2022, 12, 7, 14, 14, 46, 0)),
+                       'geometry': kw.get('geometry', 'POINT(23 34)')})
 
     def add_country(self, country_code, geometry):
         self.add_data('country_grid',
@@ -132,14 +124,12 @@ class APITester:
                        'area': 0.1,
                        'geometry': geometry})
 
-
     def add_country_name(self, country_code, names, partition=0):
         self.add_data('country_name',
                       {'country_code': country_code,
                        'name': names,
                        'partition': partition})
 
-
     def add_search_name(self, place_id, **kw):
         centroid = kw.get('centroid', (23.0, 34.0))
         self.add_data('search_name',
@@ -152,7 +142,6 @@ class APITester:
                        'country_code': kw.get('country_code', 'xx'),
                        'centroid': 'POINT(%f %f)' % centroid})
 
-
     def add_class_type_table(self, cls, typ):
         self.async_to_sync(
             self.exec_async(sa.text(f"""CREATE TABLE place_classtype_{cls}_{typ}
@@ -160,7 +149,6 @@ class APITester:
                                              WHERE class = '{cls}' AND type = '{typ}')
                                      """)))
 
-
     def add_word_table(self, content):
         data = [dict(zip(['word_id', 'word_token', 'type', 'word', 'info'], c))
                 for c in content]
@@ -176,12 +164,10 @@ class APITester:
 
         self.async_to_sync(_do_sql())
 
-
     async def exec_async(self, sql, *args, **kwargs):
         async with self.api._async_api.begin() as conn:
             return await conn.execute(sql, *args, **kwargs)
 
-
     async def create_tables(self):
         async with self.api._async_api._engine.begin() as conn:
             await conn.run_sync(self.api._async_api._tables.meta.create_all)
@@ -206,17 +192,18 @@ def apiobj(temp_db_with_extensions, temp_db_conn, monkeypatch):
 
 
 @pytest.fixture(params=['postgres_db', 'sqlite_db'])
-def frontend(request, event_loop, tmp_path):
+def frontend(request, tmp_path):
     testapis = []
     if request.param == 'sqlite_db':
         db = str(tmp_path / 'test_nominatim_python_unittest.sqlite')
 
         def mkapi(apiobj, options={'reverse'}):
-            apiobj.add_data('properties',
-                        [{'property': 'tokenizer', 'value': 'icu'},
-                         {'property': 'tokenizer_import_normalisation', 'value': ':: lower();'},
-                         {'property': 'tokenizer_import_transliteration', 'value': "'1' > '/1/'; 'ä' > 'ä '"},
-                        ])
+            apiobj.add_data(
+                'properties',
+                [{'property': 'tokenizer', 'value': 'icu'},
+                 {'property': 'tokenizer_import_normalisation', 'value': ':: lower();'},
+                 {'property': 'tokenizer_import_transliteration',
+                  'value': "'1' > '/1/'; 'ä' > 'ä '"}])
 
             async def _do_sql():
                 async with apiobj.api._async_api.begin() as conn:
@@ -228,7 +215,7 @@ def frontend(request, event_loop, tmp_path):
 
             apiobj.async_to_sync(_do_sql())
 
-            event_loop.run_until_complete(convert_sqlite.convert(None, db, options))
+            apiobj.async_to_sync(convert_sqlite.convert(None, db, options))
             outapi = napi.NominatimAPI(environ={'NOMINATIM_DATABASE_DSN': f"sqlite:dbname={db}",
                                                 'NOMINATIM_USE_US_TIGER_DATA': 'yes'})
             testapis.append(outapi)
diff --git a/test/python/api/fake_adaptor.py b/test/python/api/fake_adaptor.py
index 4b64c17d..a3a3bcf9 100644
--- a/test/python/api/fake_adaptor.py
+++ b/test/python/api/fake_adaptor.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Provides dummy implementations of ASGIAdaptor for testing.
@@ -13,6 +13,7 @@ import nominatim_api.v1.server_glue as glue
 from nominatim_api.v1.format import dispatch as formatting
 from nominatim_api.config import Configuration
 
+
 class FakeError(BaseException):
 
     def __init__(self, msg, status):
@@ -22,8 +23,10 @@ class FakeError(BaseException):
     def __str__(self):
         return f'{self.status} -- {self.msg}'
 
+
 FakeResponse = namedtuple('FakeResponse', ['status', 'output', 'content_type'])
 
+
 class FakeAdaptor(glue.ASGIAdaptor):
 
     def __init__(self, params=None, headers=None, config=None):
@@ -31,23 +34,18 @@ class FakeAdaptor(glue.ASGIAdaptor):
         self.headers = headers or {}
         self._config = config or Configuration(None)
 
-
     def get(self, name, default=None):
         return self.params.get(name, default)
 
-
     def get_header(self, name, default=None):
         return self.headers.get(name, default)
 
-
     def error(self, msg, status=400):
         return FakeError(msg, status)
 
-
     def create_response(self, status, output, num_results):
         return FakeResponse(status, output, self.content_type)
 
-
     def base_uri(self):
         return 'http://test'
 
@@ -56,5 +54,3 @@ class FakeAdaptor(glue.ASGIAdaptor):
 
     def formatting(self):
         return formatting
-
-
diff --git a/test/python/api/query_processing/test_normalize.py b/test/python/api/query_processing/test_normalize.py
new file mode 100644
index 00000000..35f5fcd7
--- /dev/null
+++ b/test/python/api/query_processing/test_normalize.py
@@ -0,0 +1,31 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Tests for normalizing search queries.
+"""
+from icu import Transliterator
+
+import nominatim_api.search.query as qmod
+from nominatim_api.query_preprocessing.config import QueryConfig
+from nominatim_api.query_preprocessing import normalize
+
+
+def run_preprocessor_on(query, norm):
+    """ Run the normalize preprocessor, built from the ICU rules in `norm`, over `query`. """
+    normalizer = Transliterator.createFromRules("normalization", norm)
+    proc = normalize.create(QueryConfig().set_normalizer(normalizer))
+    return proc(query)
+
+
+def test_normalize_simple():
+    """ A ':: lower();' rule must lower-case the text of the single input phrase. """
+    norm = ':: lower();'
+    query = [qmod.Phrase(qmod.PHRASE_ANY, 'Hallo')]
+    out = run_preprocessor_on(query, norm)
+
+    assert len(out) == 1
+    assert out == [qmod.Phrase(qmod.PHRASE_ANY, 'hallo')]
diff --git a/test/python/api/query_processing/test_regex_replace.py b/test/python/api/query_processing/test_regex_replace.py
new file mode 100644
index 00000000..ef759ba1
--- /dev/null
+++ b/test/python/api/query_processing/test_regex_replace.py
@@ -0,0 +1,49 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+'''
+Tests for replacing values in an input using custom regex.
+'''
+import pytest
+
+import nominatim_api.search.query as qmod
+from nominatim_api.query_preprocessing.config import QueryConfig
+from nominatim_api.query_preprocessing import regex_replace
+
+
+def run_preprocessor_on(query):
+    """ Run regex_replace over `query`, blanking IPv4 addresses and HTTP(S) URLs. """
+    config = QueryConfig()
+    config.set_normalizer(None)
+    config['replacements'] = [
+        {'pattern': r'\b(?:\d{1,3}\.){3}\d{1,3}\b', 'replace': ''},  # IPv4
+        {'pattern': r'https?://\S+', 'replace': ''}  # HTTP/HTTPS URLs
+    ]
+
+    proc = regex_replace.create(config)
+    return proc(query)
+
+
+@pytest.mark.parametrize('inp,outp', [
+    (['45.67.89.101'], []),
+    (['198.51.100.23'], []),
+    (['203.0.113.255'], []),
+    (['http://www.openstreetmap.org'], []),
+    (['https://www.openstreetmap.org/edit'], []),
+    (['http://osm.org'], []),
+    (['https://www.openstreetmap.org/user/abc'], []),
+    (['https://tile.openstreetmap.org/12/2048/2048.png'], []),
+    (['Check the map at https://www.openstreetmap.org'], ['Check the map at ']),
+    (['Use 203.0.113.255 for routing'], ['Use  for routing']),
+    (['Find maps at https://osm.org and http://openstreetmap.org'], ['Find maps at  and ']),
+    (['203.0.113.255', 'Some Address'], ['Some Address']),
+    (['https://osm.org', 'Another Place'], ['Another Place']),
+])
+def test_split_phrases(inp, outp):
+    """ Matches must be cut out of each phrase and phrases left empty must be dropped. """
+    query = [qmod.Phrase(qmod.PHRASE_ANY, text) for text in inp]
+    out = run_preprocessor_on(query)
+    assert out == [qmod.Phrase(qmod.PHRASE_ANY, text) for text in outp]
diff --git a/test/python/api/query_processing/test_split_japanese_phrases.py b/test/python/api/query_processing/test_split_japanese_phrases.py
new file mode 100644
index 00000000..30f22e7b
--- /dev/null
+++ b/test/python/api/query_processing/test_split_japanese_phrases.py
@@ -0,0 +1,31 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Tests for japanese phrase splitting.
+"""
+import pytest
+
+import nominatim_api.search.query as qmod
+from nominatim_api.query_preprocessing.config import QueryConfig
+from nominatim_api.query_preprocessing import split_japanese_phrases
+
+
+def run_preprocessor_on(query):
+    """ Run the split_japanese_phrases preprocessor (no normalizer set) over `query`. """
+    proc = split_japanese_phrases.create(QueryConfig().set_normalizer(None))
+    return proc(query)
+
+
+@pytest.mark.parametrize('inp,outp', [('大阪府大阪市大阪', '大阪府:大阪市:大阪'),
+                                      ('大阪府大阪', '大阪府:大阪'),
+                                      ('大阪市大阪', '大阪市:大阪')])
+def test_split_phrases(inp, outp):
+    """ Japanese address text must come back with ':' inserted after the 府 and 市 parts. """
+    query = [qmod.Phrase(qmod.PHRASE_ANY, inp)]
+    out = run_preprocessor_on(query)
+
+    assert out == [qmod.Phrase(qmod.PHRASE_ANY, outp)]
diff --git a/test/python/api/search/test_api_search_query.py b/test/python/api/search/test_api_search_query.py
index 71caf5b7..ea3b9772 100644
--- a/test/python/api/search/test_api_search_query.py
+++ b/test/python/api/search/test_api_search_query.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for tokenized query data structures.
@@ -11,6 +11,7 @@ import pytest
 
 from nominatim_api.search import query
 
+
 class MyToken(query.Token):
 
     def get_category(self):
@@ -22,42 +23,42 @@ def mktoken(tid: int):
                    lookup_word='foo')
 
 
-@pytest.mark.parametrize('ptype,ttype', [('NONE', 'WORD'),
-                                         ('AMENITY', 'QUALIFIER'),
-                                         ('STREET', 'PARTIAL'),
-                                         ('CITY', 'WORD'),
-                                         ('COUNTRY', 'COUNTRY'),
-                                         ('POSTCODE', 'POSTCODE')])
+@pytest.fixture
+def qnode():
+    return query.QueryNode(query.BREAK_PHRASE, query.PHRASE_ANY, 0.0, '', '')
+
+
+@pytest.mark.parametrize('ptype,ttype', [(query.PHRASE_ANY, 'W'),
+                                         (query.PHRASE_AMENITY, 'Q'),
+                                         (query.PHRASE_STREET, 'w'),
+                                         (query.PHRASE_CITY, 'W'),
+                                         (query.PHRASE_COUNTRY, 'C'),
+                                         (query.PHRASE_POSTCODE, 'P')])
 def test_phrase_compatible(ptype, ttype):
-    assert query.PhraseType[ptype].compatible_with(query.TokenType[ttype], False)
+    assert query._phrase_compatible_with(ptype, ttype, False)
 
 
-@pytest.mark.parametrize('ptype', ['COUNTRY', 'POSTCODE'])
+@pytest.mark.parametrize('ptype', [query.PHRASE_COUNTRY, query.PHRASE_POSTCODE])
 def test_phrase_incompatible(ptype):
-    assert not query.PhraseType[ptype].compatible_with(query.TokenType.PARTIAL, True)
+    assert not query._phrase_compatible_with(ptype, query.TOKEN_PARTIAL, True)
 
 
-def test_query_node_empty():
-    qn = query.QueryNode(query.BreakType.PHRASE, query.PhraseType.NONE)
+def test_query_node_empty(qnode):
+    assert qnode.get_tokens(3, query.TOKEN_WORD) is None
 
-    assert not qn.has_tokens(3, query.TokenType.PARTIAL)
-    assert qn.get_tokens(3, query.TokenType.WORD) is None
 
+def test_query_node_with_content(qnode):
+    qnode.starting.append(query.TokenList(2, query.TOKEN_PARTIAL, [mktoken(100), mktoken(101)]))
+    qnode.starting.append(query.TokenList(2, query.TOKEN_WORD, [mktoken(1000)]))
 
-def test_query_node_with_content():
-    qn = query.QueryNode(query.BreakType.PHRASE, query.PhraseType.NONE)
-    qn.starting.append(query.TokenList(2, query.TokenType.PARTIAL, [mktoken(100), mktoken(101)]))
-    qn.starting.append(query.TokenList(2, query.TokenType.WORD, [mktoken(1000)]))
+    assert not qnode.has_tokens(3, query.TOKEN_PARTIAL)
+    assert not qnode.has_tokens(2, query.TOKEN_COUNTRY)
+    assert qnode.has_tokens(2, query.TOKEN_PARTIAL)
+    assert qnode.has_tokens(2, query.TOKEN_WORD)
 
-    assert not qn.has_tokens(3, query.TokenType.PARTIAL)
-    assert not qn.has_tokens(2, query.TokenType.COUNTRY)
-    assert qn.has_tokens(2, query.TokenType.PARTIAL)
-    assert qn.has_tokens(2, query.TokenType.WORD)
-
-    assert qn.get_tokens(3, query.TokenType.PARTIAL) is None
-    assert qn.get_tokens(2, query.TokenType.COUNTRY) is None
-    assert len(qn.get_tokens(2, query.TokenType.PARTIAL)) == 2
-    assert len(qn.get_tokens(2, query.TokenType.WORD)) == 1
+    assert qnode.get_tokens(2, query.TOKEN_COUNTRY) is None
+    assert len(qnode.get_tokens(2, query.TOKEN_PARTIAL)) == 2
+    assert len(qnode.get_tokens(2, query.TOKEN_WORD)) == 1
 
 
 def test_query_struct_empty():
@@ -67,21 +68,21 @@ def test_query_struct_empty():
 
 
 def test_query_struct_with_tokens():
-    q = query.QueryStruct([query.Phrase(query.PhraseType.NONE, 'foo bar')])
-    q.add_node(query.BreakType.WORD, query.PhraseType.NONE)
-    q.add_node(query.BreakType.END, query.PhraseType.NONE)
+    q = query.QueryStruct([query.Phrase(query.PHRASE_ANY, 'foo bar')])
+    q.add_node(query.BREAK_WORD, query.PHRASE_ANY)
+    q.add_node(query.BREAK_END, query.PHRASE_ANY)
 
     assert q.num_token_slots() == 2
 
-    q.add_token(query.TokenRange(0, 1), query.TokenType.PARTIAL, mktoken(1))
-    q.add_token(query.TokenRange(1, 2), query.TokenType.PARTIAL, mktoken(2))
-    q.add_token(query.TokenRange(1, 2), query.TokenType.WORD, mktoken(99))
-    q.add_token(query.TokenRange(1, 2), query.TokenType.WORD, mktoken(98))
+    q.add_token(query.TokenRange(0, 1), query.TOKEN_PARTIAL, mktoken(1))
+    q.add_token(query.TokenRange(1, 2), query.TOKEN_PARTIAL, mktoken(2))
+    q.add_token(query.TokenRange(1, 2), query.TOKEN_WORD, mktoken(99))
+    q.add_token(query.TokenRange(1, 2), query.TOKEN_WORD, mktoken(98))
 
-    assert q.get_tokens(query.TokenRange(0, 2), query.TokenType.WORD) == []
-    assert len(q.get_tokens(query.TokenRange(1, 2), query.TokenType.WORD)) == 2
+    assert q.get_tokens(query.TokenRange(0, 2), query.TOKEN_WORD) == []
+    assert len(q.get_tokens(query.TokenRange(1, 2), query.TOKEN_WORD)) == 2
 
-    partials = q.get_partials_list(query.TokenRange(0, 2))
+    partials = list(q.iter_partials(query.TokenRange(0, 2)))
 
     assert len(partials) == 2
     assert [t.token for t in partials] == [1, 2]
@@ -91,45 +92,43 @@ def test_query_struct_with_tokens():
 
 
 def test_query_struct_incompatible_token():
-    q = query.QueryStruct([query.Phrase(query.PhraseType.COUNTRY, 'foo bar')])
-    q.add_node(query.BreakType.WORD, query.PhraseType.COUNTRY)
-    q.add_node(query.BreakType.END, query.PhraseType.NONE)
+    q = query.QueryStruct([query.Phrase(query.PHRASE_COUNTRY, 'foo bar')])
+    q.add_node(query.BREAK_WORD, query.PHRASE_COUNTRY)
+    q.add_node(query.BREAK_END, query.PHRASE_ANY)
 
-    q.add_token(query.TokenRange(0, 1), query.TokenType.PARTIAL, mktoken(1))
-    q.add_token(query.TokenRange(1, 2), query.TokenType.COUNTRY, mktoken(100))
+    q.add_token(query.TokenRange(0, 1), query.TOKEN_PARTIAL, mktoken(1))
+    q.add_token(query.TokenRange(1, 2), query.TOKEN_COUNTRY, mktoken(100))
 
-    assert q.get_tokens(query.TokenRange(0, 1), query.TokenType.PARTIAL) == []
-    assert len(q.get_tokens(query.TokenRange(1, 2), query.TokenType.COUNTRY)) == 1
+    assert len(q.get_tokens(query.TokenRange(1, 2), query.TOKEN_COUNTRY)) == 1
 
 
 def test_query_struct_amenity_single_word():
-    q = query.QueryStruct([query.Phrase(query.PhraseType.AMENITY, 'bar')])
-    q.add_node(query.BreakType.END, query.PhraseType.NONE)
+    q = query.QueryStruct([query.Phrase(query.PHRASE_AMENITY, 'bar')])
+    q.add_node(query.BREAK_END, query.PHRASE_ANY)
 
-    q.add_token(query.TokenRange(0, 1), query.TokenType.PARTIAL, mktoken(1))
-    q.add_token(query.TokenRange(0, 1), query.TokenType.NEAR_ITEM, mktoken(2))
-    q.add_token(query.TokenRange(0, 1), query.TokenType.QUALIFIER, mktoken(3))
+    q.add_token(query.TokenRange(0, 1), query.TOKEN_PARTIAL, mktoken(1))
+    q.add_token(query.TokenRange(0, 1), query.TOKEN_NEAR_ITEM, mktoken(2))
+    q.add_token(query.TokenRange(0, 1), query.TOKEN_QUALIFIER, mktoken(3))
 
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.PARTIAL)) == 1
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.NEAR_ITEM)) == 1
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.QUALIFIER)) == 0
+    assert q.nodes[0].partial.token == 1
+    assert len(q.get_tokens(query.TokenRange(0, 1), query.TOKEN_NEAR_ITEM)) == 1
+    assert len(q.get_tokens(query.TokenRange(0, 1), query.TOKEN_QUALIFIER)) == 0
 
 
 def test_query_struct_amenity_two_words():
-    q = query.QueryStruct([query.Phrase(query.PhraseType.AMENITY, 'foo bar')])
-    q.add_node(query.BreakType.WORD, query.PhraseType.AMENITY)
-    q.add_node(query.BreakType.END, query.PhraseType.NONE)
+    q = query.QueryStruct([query.Phrase(query.PHRASE_AMENITY, 'foo bar')])
+    q.add_node(query.BREAK_WORD, query.PHRASE_AMENITY)
+    q.add_node(query.BREAK_END, query.PHRASE_ANY)
 
     for trange in [(0, 1), (1, 2)]:
-        q.add_token(query.TokenRange(*trange), query.TokenType.PARTIAL, mktoken(1))
-        q.add_token(query.TokenRange(*trange), query.TokenType.NEAR_ITEM, mktoken(2))
-        q.add_token(query.TokenRange(*trange), query.TokenType.QUALIFIER, mktoken(3))
-
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.PARTIAL)) == 1
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.NEAR_ITEM)) == 0
-    assert len(q.get_tokens(query.TokenRange(0, 1), query.TokenType.QUALIFIER)) == 1
+        q.add_token(query.TokenRange(*trange), query.TOKEN_PARTIAL, mktoken(1))
+        q.add_token(query.TokenRange(*trange), query.TOKEN_NEAR_ITEM, mktoken(2))
+        q.add_token(query.TokenRange(*trange), query.TOKEN_QUALIFIER, mktoken(3))
 
-    assert len(q.get_tokens(query.TokenRange(1, 2), query.TokenType.PARTIAL)) == 1
-    assert len(q.get_tokens(query.TokenRange(1, 2), query.TokenType.NEAR_ITEM)) == 0
-    assert len(q.get_tokens(query.TokenRange(1, 2), query.TokenType.QUALIFIER)) == 1
+    assert q.nodes[0].partial.token == 1
+    assert len(q.get_tokens(query.TokenRange(0, 1), query.TOKEN_NEAR_ITEM)) == 0
+    assert len(q.get_tokens(query.TokenRange(0, 1), query.TOKEN_QUALIFIER)) == 1
 
+    assert q.nodes[1].partial.token == 1
+    assert len(q.get_tokens(query.TokenRange(1, 2), query.TOKEN_NEAR_ITEM)) == 0
+    assert len(q.get_tokens(query.TokenRange(1, 2), query.TOKEN_QUALIFIER)) == 1
diff --git a/test/python/api/search/test_db_search_builder.py b/test/python/api/search/test_db_search_builder.py
index 371a6f02..be34fbea 100644
--- a/test/python/api/search/test_db_search_builder.py
+++ b/test/python/api/search/test_db_search_builder.py
@@ -9,38 +9,39 @@ Tests for creating abstract searches from token assignments.
 """
 import pytest
 
-from nominatim_api.search.query import Token, TokenRange, BreakType, PhraseType, TokenType, QueryStruct, Phrase
+from nominatim_api.search.query import Token, TokenRange, QueryStruct, Phrase
+import nominatim_api.search.query as qmod
 from nominatim_api.search.db_search_builder import SearchBuilder
 from nominatim_api.search.token_assignment import TokenAssignment
 from nominatim_api.types import SearchDetails
 import nominatim_api.search.db_searches as dbs
 
+
 class MyToken(Token):
     def get_category(self):
         return 'this', 'that'
 
 
 def make_query(*args):
-    q = QueryStruct([Phrase(PhraseType.NONE, '')])
+    q = QueryStruct([Phrase(qmod.PHRASE_ANY, '')])
 
     for _ in range(max(inner[0] for tlist in args for inner in tlist)):
-        q.add_node(BreakType.WORD, PhraseType.NONE)
-    q.add_node(BreakType.END, PhraseType.NONE)
+        q.add_node(qmod.BREAK_WORD, qmod.PHRASE_ANY)
+    q.add_node(qmod.BREAK_END, qmod.PHRASE_ANY)
 
     for start, tlist in enumerate(args):
         for end, ttype, tinfo in tlist:
             for tid, word in tinfo:
                 q.add_token(TokenRange(start, end), ttype,
-                            MyToken(penalty=0.5 if ttype == TokenType.PARTIAL else 0.0,
+                            MyToken(penalty=0.5 if ttype == qmod.TOKEN_PARTIAL else 0.0,
                                     token=tid, count=1, addr_count=1,
                                     lookup_word=word))
 
-
     return q
 
 
 def test_country_search():
-    q = make_query([(1, TokenType.COUNTRY, [(2, 'de'), (3, 'en')])])
+    q = make_query([(1, qmod.TOKEN_COUNTRY, [(2, 'de'), (3, 'en')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(country=TokenRange(0, 1))))
@@ -54,7 +55,7 @@ def test_country_search():
 
 
 def test_country_search_with_country_restriction():
-    q = make_query([(1, TokenType.COUNTRY, [(2, 'de'), (3, 'en')])])
+    q = make_query([(1, qmod.TOKEN_COUNTRY, [(2, 'de'), (3, 'en')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'countries': 'en,fr'}))
 
     searches = list(builder.build(TokenAssignment(country=TokenRange(0, 1))))
@@ -68,7 +69,7 @@ def test_country_search_with_country_restriction():
 
 
 def test_country_search_with_conflicting_country_restriction():
-    q = make_query([(1, TokenType.COUNTRY, [(2, 'de'), (3, 'en')])])
+    q = make_query([(1, qmod.TOKEN_COUNTRY, [(2, 'de'), (3, 'en')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'countries': 'fr'}))
 
     searches = list(builder.build(TokenAssignment(country=TokenRange(0, 1))))
@@ -77,7 +78,7 @@ def test_country_search_with_conflicting_country_restriction():
 
 
 def test_postcode_search_simple():
-    q = make_query([(1, TokenType.POSTCODE, [(34, '2367')])])
+    q = make_query([(1, qmod.TOKEN_POSTCODE, [(34, '2367')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(postcode=TokenRange(0, 1))))
@@ -93,8 +94,8 @@ def test_postcode_search_simple():
 
 
 def test_postcode_with_country():
-    q = make_query([(1, TokenType.POSTCODE, [(34, '2367')])],
-                   [(2, TokenType.COUNTRY, [(1, 'xx')])])
+    q = make_query([(1, qmod.TOKEN_POSTCODE, [(34, '2367')])],
+                   [(2, qmod.TOKEN_COUNTRY, [(1, 'xx')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(postcode=TokenRange(0, 1),
@@ -111,8 +112,8 @@ def test_postcode_with_country():
 
 
 def test_postcode_with_address():
-    q = make_query([(1, TokenType.POSTCODE, [(34, '2367')])],
-                   [(2, TokenType.PARTIAL, [(100, 'word')])])
+    q = make_query([(1, qmod.TOKEN_POSTCODE, [(34, '2367')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(100, 'word')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(postcode=TokenRange(0, 1),
@@ -129,9 +130,9 @@ def test_postcode_with_address():
 
 
 def test_postcode_with_address_with_full_word():
-    q = make_query([(1, TokenType.POSTCODE, [(34, '2367')])],
-                   [(2, TokenType.PARTIAL, [(100, 'word')]),
-                    (2, TokenType.WORD, [(1, 'full')])])
+    q = make_query([(1, qmod.TOKEN_POSTCODE, [(34, '2367')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(100, 'word')]),
+                    (2, qmod.TOKEN_WORD, [(1, 'full')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(postcode=TokenRange(0, 1),
@@ -150,7 +151,7 @@ def test_postcode_with_address_with_full_word():
 @pytest.mark.parametrize('kwargs', [{'viewbox': '0,0,1,1', 'bounded_viewbox': True},
                                     {'near': '10,10'}])
 def test_near_item_only(kwargs):
-    q = make_query([(1, TokenType.NEAR_ITEM, [(2, 'foo')])])
+    q = make_query([(1, qmod.TOKEN_NEAR_ITEM, [(2, 'foo')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs(kwargs))
 
     searches = list(builder.build(TokenAssignment(near_item=TokenRange(0, 1))))
@@ -166,7 +167,7 @@ def test_near_item_only(kwargs):
 @pytest.mark.parametrize('kwargs', [{'viewbox': '0,0,1,1'},
                                     {}])
 def test_near_item_skipped(kwargs):
-    q = make_query([(1, TokenType.NEAR_ITEM, [(2, 'foo')])])
+    q = make_query([(1, qmod.TOKEN_NEAR_ITEM, [(2, 'foo')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs(kwargs))
 
     searches = list(builder.build(TokenAssignment(near_item=TokenRange(0, 1))))
@@ -175,8 +176,8 @@ def test_near_item_skipped(kwargs):
 
 
 def test_name_only_search():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1))))
@@ -194,9 +195,9 @@ def test_name_only_search():
 
 
 def test_name_with_qualifier():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])],
-                   [(2, TokenType.QUALIFIER, [(55, 'hotel')])])
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])],
+                   [(2, qmod.TOKEN_QUALIFIER, [(55, 'hotel')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1),
@@ -215,9 +216,9 @@ def test_name_with_qualifier():
 
 
 def test_name_with_housenumber_search():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])],
-                   [(2, TokenType.HOUSENUMBER, [(66, '66')])])
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])],
+                   [(2, qmod.TOKEN_HOUSENUMBER, [(66, '66')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1),
@@ -235,13 +236,12 @@ def test_name_with_housenumber_search():
 
 
 def test_name_and_address():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])],
-                   [(2, TokenType.PARTIAL, [(2, 'b')]),
-                    (2, TokenType.WORD, [(101, 'b')])],
-                   [(3, TokenType.PARTIAL, [(3, 'c')]),
-                    (3, TokenType.WORD, [(102, 'c')])]
-                  )
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(2, 'b')]),
+                    (2, qmod.TOKEN_WORD, [(101, 'b')])],
+                   [(3, qmod.TOKEN_PARTIAL, [(3, 'c')]),
+                    (3, qmod.TOKEN_WORD, [(102, 'c')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1),
@@ -260,14 +260,13 @@ def test_name_and_address():
 
 
 def test_name_and_complex_address():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])],
-                   [(2, TokenType.PARTIAL, [(2, 'b')]),
-                    (3, TokenType.WORD, [(101, 'bc')])],
-                   [(3, TokenType.PARTIAL, [(3, 'c')])],
-                   [(4, TokenType.PARTIAL, [(4, 'd')]),
-                    (4, TokenType.WORD, [(103, 'd')])]
-                  )
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(2, 'b')]),
+                    (3, qmod.TOKEN_WORD, [(101, 'bc')])],
+                   [(3, qmod.TOKEN_PARTIAL, [(3, 'c')])],
+                   [(4, qmod.TOKEN_PARTIAL, [(4, 'd')]),
+                    (4, qmod.TOKEN_WORD, [(103, 'd')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1),
@@ -286,9 +285,9 @@ def test_name_and_complex_address():
 
 
 def test_name_only_near_search():
-    q = make_query([(1, TokenType.NEAR_ITEM, [(88, 'g')])],
-                   [(2, TokenType.PARTIAL, [(1, 'a')]),
-                    (2, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_NEAR_ITEM, [(88, 'g')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (2, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails())
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(1, 2),
@@ -302,8 +301,8 @@ def test_name_only_near_search():
 
 
 def test_name_only_search_with_category():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'categories': [('foo', 'bar')]}))
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1))))
@@ -316,9 +315,9 @@ def test_name_only_search_with_category():
 
 
 def test_name_with_near_item_search_with_category_mismatch():
-    q = make_query([(1, TokenType.NEAR_ITEM, [(88, 'g')])],
-                   [(2, TokenType.PARTIAL, [(1, 'a')]),
-                    (2, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_NEAR_ITEM, [(88, 'g')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (2, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'categories': [('foo', 'bar')]}))
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(1, 2),
@@ -328,9 +327,9 @@ def test_name_with_near_item_search_with_category_mismatch():
 
 
 def test_name_with_near_item_search_with_category_match():
-    q = make_query([(1, TokenType.NEAR_ITEM, [(88, 'g')])],
-                   [(2, TokenType.PARTIAL, [(1, 'a')]),
-                    (2, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_NEAR_ITEM, [(88, 'g')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (2, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'categories': [('foo', 'bar'),
                                                                          ('this', 'that')]}))
 
@@ -345,9 +344,9 @@ def test_name_with_near_item_search_with_category_match():
 
 
 def test_name_with_qualifier_search_with_category_mismatch():
-    q = make_query([(1, TokenType.QUALIFIER, [(88, 'g')])],
-                   [(2, TokenType.PARTIAL, [(1, 'a')]),
-                    (2, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_QUALIFIER, [(88, 'g')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (2, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'categories': [('foo', 'bar')]}))
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(1, 2),
@@ -357,9 +356,9 @@ def test_name_with_qualifier_search_with_category_mismatch():
 
 
 def test_name_with_qualifier_search_with_category_match():
-    q = make_query([(1, TokenType.QUALIFIER, [(88, 'g')])],
-                   [(2, TokenType.PARTIAL, [(1, 'a')]),
-                    (2, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_QUALIFIER, [(88, 'g')])],
+                   [(2, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (2, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'categories': [('foo', 'bar'),
                                                                          ('this', 'that')]}))
 
@@ -374,8 +373,8 @@ def test_name_with_qualifier_search_with_category_match():
 
 
 def test_name_only_search_with_countries():
-    q = make_query([(1, TokenType.PARTIAL, [(1, 'a')]),
-                    (1, TokenType.WORD, [(100, 'a')])])
+    q = make_query([(1, qmod.TOKEN_PARTIAL, [(1, 'a')]),
+                    (1, qmod.TOKEN_WORD, [(100, 'a')])])
     builder = SearchBuilder(q, SearchDetails.from_kwargs({'countries': 'de,en'}))
 
     searches = list(builder.build(TokenAssignment(name=TokenRange(0, 1))))
@@ -391,19 +390,19 @@ def test_name_only_search_with_countries():
 
 def make_counted_searches(name_part, name_full, address_part, address_full,
                           num_address_parts=1):
-    q = QueryStruct([Phrase(PhraseType.NONE, '')])
+    q = QueryStruct([Phrase(qmod.PHRASE_ANY, '')])
     for i in range(1 + num_address_parts):
-        q.add_node(BreakType.WORD, PhraseType.NONE)
-    q.add_node(BreakType.END, PhraseType.NONE)
+        q.add_node(qmod.BREAK_WORD, qmod.PHRASE_ANY)
+    q.add_node(qmod.BREAK_END, qmod.PHRASE_ANY)
 
-    q.add_token(TokenRange(0, 1), TokenType.PARTIAL,
+    q.add_token(TokenRange(0, 1), qmod.TOKEN_PARTIAL,
                 MyToken(0.5, 1, name_part, 1, 'name_part'))
-    q.add_token(TokenRange(0, 1), TokenType.WORD,
+    q.add_token(TokenRange(0, 1), qmod.TOKEN_WORD,
                 MyToken(0, 101, name_full, 1, 'name_full'))
     for i in range(num_address_parts):
-        q.add_token(TokenRange(i + 1, i + 2), TokenType.PARTIAL,
+        q.add_token(TokenRange(i + 1, i + 2), qmod.TOKEN_PARTIAL,
                     MyToken(0.5, 2, address_part, 1, 'address_part'))
-        q.add_token(TokenRange(i + 1, i + 2), TokenType.WORD,
+        q.add_token(TokenRange(i + 1, i + 2), qmod.TOKEN_WORD,
                     MyToken(0, 102, address_full, 1, 'address_full'))
 
     builder = SearchBuilder(q, SearchDetails())
@@ -422,8 +421,8 @@ def test_infrequent_partials_in_name():
     assert len(search.lookups) == 2
     assert len(search.rankings) == 2
 
-    assert set((l.column, l.lookup_type.__name__) for l in search.lookups) == \
-            {('name_vector', 'LookupAll'), ('nameaddress_vector', 'Restrict')}
+    assert set((s.column, s.lookup_type.__name__) for s in search.lookups) == \
+        {('name_vector', 'LookupAll'), ('nameaddress_vector', 'Restrict')}
 
 
 def test_frequent_partials_in_name_and_address():
@@ -434,10 +433,10 @@ def test_frequent_partials_in_name_and_address():
     assert all(isinstance(s, dbs.PlaceSearch) for s in searches)
     searches.sort(key=lambda s: s.penalty)
 
-    assert set((l.column, l.lookup_type.__name__) for l in searches[0].lookups) == \
-            {('name_vector', 'LookupAny'), ('nameaddress_vector', 'Restrict')}
-    assert set((l.column, l.lookup_type.__name__) for l in searches[1].lookups) == \
-            {('nameaddress_vector', 'LookupAll'), ('name_vector', 'LookupAll')}
+    assert set((s.column, s.lookup_type.__name__) for s in searches[0].lookups) == \
+        {('name_vector', 'LookupAny'), ('nameaddress_vector', 'Restrict')}
+    assert set((s.column, s.lookup_type.__name__) for s in searches[1].lookups) == \
+        {('nameaddress_vector', 'LookupAll'), ('name_vector', 'LookupAll')}
 
 
 def test_too_frequent_partials_in_name_and_address():
@@ -448,5 +447,5 @@ def test_too_frequent_partials_in_name_and_address():
     assert all(isinstance(s, dbs.PlaceSearch) for s in searches)
     searches.sort(key=lambda s: s.penalty)
 
-    assert set((l.column, l.lookup_type.__name__) for l in searches[0].lookups) == \
-            {('name_vector', 'LookupAny'), ('nameaddress_vector', 'Restrict')}
+    assert set((s.column, s.lookup_type.__name__) for s in searches[0].lookups) == \
+        {('name_vector', 'LookupAny'), ('nameaddress_vector', 'Restrict')}
diff --git a/test/python/api/search/test_icu_query_analyzer.py b/test/python/api/search/test_icu_query_analyzer.py
index ac4bcbb7..39ec8fd6 100644
--- a/test/python/api/search/test_icu_query_analyzer.py
+++ b/test/python/api/search/test_icu_query_analyzer.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for query analyzer for ICU tokenizer.
@@ -11,11 +11,13 @@ import pytest
 import pytest_asyncio
 
 from nominatim_api import NominatimAPIAsync
-from nominatim_api.search.query import Phrase, PhraseType, TokenType, BreakType
+from nominatim_api.search.query import Phrase
+import nominatim_api.search.query as qmod
 import nominatim_api.search.icu_tokenizer as tok
 from nominatim_api.logging import set_log_output, get_and_disable
 
-async def add_word(conn, word_id, word_token, wtype, word, info = None):
+
+async def add_word(conn, word_id, word_token, wtype, word, info=None):
     t = conn.t.meta.tables['word']
     await conn.execute(t.insert(), {'word_id': word_id,
                                     'word_token': word_token,
@@ -25,7 +27,8 @@ async def add_word(conn, word_id, word_token, wtype, word, info = None):
 
 
 def make_phrase(query):
-    return [Phrase(PhraseType.NONE, s) for s in query.split(',')]
+    return [Phrase(qmod.PHRASE_ANY, s) for s in query.split(',')]
+
 
 @pytest_asyncio.fixture
 async def conn(table_factory):
@@ -62,12 +65,12 @@ async def test_single_phrase_with_unknown_terms(conn):
     query = await ana.analyze_query(make_phrase('foo BAR'))
 
     assert len(query.source) == 1
-    assert query.source[0].ptype == PhraseType.NONE
+    assert query.source[0].ptype == qmod.PHRASE_ANY
     assert query.source[0].text == 'foo bar'
 
     assert query.num_token_slots() == 2
-    assert len(query.nodes[0].starting) == 1
-    assert not query.nodes[1].starting
+    assert query.nodes[0].partial.token == 1
+    assert query.nodes[1].partial is None
 
 
 @pytest.mark.asyncio
@@ -96,17 +99,15 @@ async def test_splitting_in_transliteration(conn):
     assert query.num_token_slots() == 2
     assert query.nodes[0].starting
     assert query.nodes[1].starting
-    assert query.nodes[1].btype == BreakType.TOKEN
+    assert query.nodes[1].btype == qmod.BREAK_TOKEN
 
 
 @pytest.mark.asyncio
-@pytest.mark.parametrize('term,order', [('23456', ['POSTCODE', 'HOUSENUMBER', 'WORD', 'PARTIAL']),
-                                        ('3', ['HOUSENUMBER', 'POSTCODE', 'WORD', 'PARTIAL'])
-                                       ])
+@pytest.mark.parametrize('term,order', [('23456', ['P', 'H', 'W']),
+                                        ('3', ['H', 'W'])])
 async def test_penalty_postcodes_and_housenumbers(conn, term, order):
     ana = await tok.create_query_analyzer(conn)
 
-    await add_word(conn, 1, term, 'P', None)
     await add_word(conn, 2, term, 'H', term)
     await add_word(conn, 3, term, 'w', term)
     await add_word(conn, 4, term, 'W', term)
@@ -115,11 +116,12 @@ async def test_penalty_postcodes_and_housenumbers(conn, term, order):
 
     assert query.num_token_slots() == 1
 
-    torder = [(tl.tokens[0].penalty, tl.ttype.name) for tl in query.nodes[0].starting]
+    torder = [(tl.tokens[0].penalty, tl.ttype) for tl in query.nodes[0].starting]
     torder.sort()
 
     assert [t[1] for t in torder] == order
 
+
 @pytest.mark.asyncio
 async def test_category_words_only_at_beginning(conn):
     ana = await tok.create_query_analyzer(conn)
@@ -131,7 +133,7 @@ async def test_category_words_only_at_beginning(conn):
 
     assert query.num_token_slots() == 3
     assert len(query.nodes[0].starting) == 1
-    assert query.nodes[0].starting[0].ttype == TokenType.NEAR_ITEM
+    assert query.nodes[0].starting[0].ttype == qmod.TOKEN_NEAR_ITEM
     assert not query.nodes[2].starting
 
 
@@ -145,7 +147,7 @@ async def test_freestanding_qualifier_words_become_category(conn):
 
     assert query.num_token_slots() == 1
     assert len(query.nodes[0].starting) == 1
-    assert query.nodes[0].starting[0].ttype == TokenType.NEAR_ITEM
+    assert query.nodes[0].starting[0].ttype == qmod.TOKEN_NEAR_ITEM
 
 
 @pytest.mark.asyncio
@@ -158,9 +160,9 @@ async def test_qualifier_words(conn):
     query = await ana.analyze_query(make_phrase('foo BAR foo BAR foo'))
 
     assert query.num_token_slots() == 5
-    assert set(t.ttype for t in query.nodes[0].starting) == {TokenType.QUALIFIER}
-    assert set(t.ttype for t in query.nodes[2].starting) == {TokenType.QUALIFIER}
-    assert set(t.ttype for t in query.nodes[4].starting) == {TokenType.QUALIFIER}
+    assert set(t.ttype for t in query.nodes[0].starting) == {qmod.TOKEN_QUALIFIER}
+    assert set(t.ttype for t in query.nodes[2].starting) == {qmod.TOKEN_QUALIFIER}
+    assert set(t.ttype for t in query.nodes[4].starting) == {qmod.TOKEN_QUALIFIER}
 
 
 @pytest.mark.asyncio
@@ -172,14 +174,16 @@ async def test_add_unknown_housenumbers(conn):
     query = await ana.analyze_query(make_phrase('466 23 99834 34a'))
 
     assert query.num_token_slots() == 4
-    assert query.nodes[0].starting[0].ttype == TokenType.HOUSENUMBER
+    assert query.nodes[0].starting[0].ttype == qmod.TOKEN_HOUSENUMBER
     assert len(query.nodes[0].starting[0].tokens) == 1
     assert query.nodes[0].starting[0].tokens[0].token == 0
-    assert query.nodes[1].starting[0].ttype == TokenType.HOUSENUMBER
+    assert query.nodes[1].starting[0].ttype == qmod.TOKEN_HOUSENUMBER
     assert len(query.nodes[1].starting[0].tokens) == 1
     assert query.nodes[1].starting[0].tokens[0].token == 1
-    assert not query.nodes[2].starting
-    assert not query.nodes[3].starting
+    assert query.nodes[2].has_tokens(3, qmod.TOKEN_POSTCODE)
+    assert not query.nodes[2].has_tokens(3, qmod.TOKEN_HOUSENUMBER)
+    assert not query.nodes[2].has_tokens(4, qmod.TOKEN_HOUSENUMBER)
+    assert not query.nodes[3].has_tokens(4, qmod.TOKEN_HOUSENUMBER)
 
 
 @pytest.mark.asyncio
diff --git a/test/python/api/search/test_postcode_parser.py b/test/python/api/search/test_postcode_parser.py
new file mode 100644
index 00000000..f7d78857
--- /dev/null
+++ b/test/python/api/search/test_postcode_parser.py
@@ -0,0 +1,171 @@
+
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Test for parsing of postcodes in queries.
+"""
+import re
+from itertools import zip_longest
+
+import pytest
+
+from nominatim_api.search.postcode_parser import PostcodeParser
+from nominatim_api.search.query import QueryStruct, PHRASE_ANY, PHRASE_POSTCODE, PHRASE_STREET
+
+
+@pytest.fixture
+def pc_config(project_env):  # writes a country_settings.yaml with test postcode patterns
+    country_file = project_env.project_dir / 'country_settings.yaml'
+    country_file.write_text(r"""
+ab:
+  postcode:
+    pattern: "ddddd ll"
+ba:
+  postcode:
+    pattern: "ddddd"
+de:
+  postcode:
+    pattern: "ddddd"
+gr:
+  postcode:
+    pattern: "(ddd) ?(dd)"
+    output: \1 \2
+in:
+  postcode:
+    pattern: "(ddd) ?(ddd)"
+    output: \1\2
+mc:
+  postcode:
+    pattern: "980dd"
+mz:
+  postcode:
+    pattern: "(dddd)(?:-dd)?"
+bn:
+  postcode:
+    pattern: "(ll) ?(dddd)"
+    output: \1\2
+ky:
+  postcode:
+    pattern: "(d)-(dddd)"
+    output: KY\1-\2
+
+gb:
+  postcode:
+    pattern: "(l?ld[A-Z0-9]?) ?(dll)"
+    output: \1 \2
+
+    """)
+    # The incoming project_env object is handed back; only the file on disk is new.
+    return project_env
+
+
+def mk_query(inp):
+    """Return a QueryStruct with one node added per word of `inp`, split on [ ,:'-]."""
+    struct = QueryStruct([])
+    # re.split keeps the captured separators: the list alternates word, break char.
+    parts = re.split(r"([ ,:'-])", inp)
+    for term, btype in zip_longest(parts[0::2], parts[1::2], fillvalue='>'):
+        struct.add_node(btype, PHRASE_ANY, 0.1, term, term)
+    return struct
+
+
+@pytest.mark.parametrize('query,pos', [('45325 Berlin', 0),
+                                       ('45325:Berlin', 0),
+                                       ('45325,Berlin', 0),
+                                       ('Berlin 45325', 1),
+                                       ('Berlin,45325', 1),
+                                       ('Berlin:45325', 1),
+                                       ('Hansastr,45325 Berlin', 1),
+                                       ('Hansastr 45325 Berlin', 1)])
+def test_simple_postcode(pc_config, query, pos):
+    """The five-digit word at slot `pos` is reported as '45325' and as '453 25'."""
+    expected = {(pos, pos + 1, code) for code in ('45325', '453 25')}
+
+    found = PostcodeParser(pc_config).parse(mk_query(query))
+    assert found == expected
+
+
+@pytest.mark.parametrize('query', ['EC1R 3HF', 'ec1r 3hf'])
+def test_postcode_matching_case_insensitive(pc_config, query):
+    """Upper- and lower-case input must both yield the upper-case postcode."""
+    found = PostcodeParser(pc_config).parse(mk_query(query))
+    assert found == {(0, 2, 'EC1R 3HF')}
+
+
+def test_contained_postcode(pc_config):
+    """The short code is reported on its own and as part of the longer match."""
+    found = PostcodeParser(pc_config).parse(mk_query('12345 dx'))
+    assert found == {(0, 1, '12345'), (0, 1, '123 45'),
+                     (0, 2, '12345 DX')}
+
+
+@pytest.mark.parametrize('query,frm,to', [('345987', 0, 1), ('345 987', 0, 2),
+                                          ('Aina 345 987', 1, 3),
+                                          ('Aina 23 345 987 ff', 2, 4)])
+def test_postcode_with_space(pc_config, query, frm, to):
+    """Six digits are found with or without a space after the third digit."""
+    expected = {(frm, to, '345987')}
+
+    found = PostcodeParser(pc_config).parse(mk_query(query))
+    assert found == expected
+
+
+def test_overlapping_postcode(pc_config):
+    """Both matches are reported although they share the word '456'."""
+    found = PostcodeParser(pc_config).parse(mk_query('123 456 78'))
+    assert found == {(0, 2, '123456'), (1, 3, '456 78')}
+
+
+@pytest.mark.parametrize('query', ['45325-Berlin', "45325'Berlin",
+                                   'Berlin-45325', "Berlin'45325", '45325Berlin',
+                                   '345-987', "345'987", '345,987', '345:987'])
+def test_not_a_postcode(pc_config, query):
+    """None of the parametrized inputs may produce a postcode match."""
+    parser = PostcodeParser(pc_config)
+    assert not parser.parse(mk_query(query))
+
+
+@pytest.mark.parametrize('query', ['ba 12233', 'ba-12233'])
+def test_postcode_with_country_prefix(pc_config, query):
+    """A separate leading 'ba' is covered by the range but not part of the postcode."""
+    found = PostcodeParser(pc_config).parse(mk_query(query))
+    assert (0, 2, '12233') in found
+
+
+def test_postcode_with_joined_country_prefix(pc_config):
+    """A 'ba' prefix glued to the digits is dropped from the reported postcode."""
+    found = PostcodeParser(pc_config).parse(mk_query('ba12233'))
+    assert found == {(0, 1, '12233')}
+
+
+def test_postcode_with_non_matching_country_prefix(pc_config):
+    """'ky12233' must not match; the fixture gives 'ky' the pattern (d)-(dddd)."""
+    found = PostcodeParser(pc_config).parse(mk_query('ky12233'))
+    assert not found
+
+
+def test_postcode_inside_postcode_phrase(pc_config):
+    """Expect only '4444'; the '12345' in the street phrase is not reported."""
+    struct = QueryStruct([])
+    struct.nodes[-1].ptype = PHRASE_STREET
+    struct.add_node(',', PHRASE_STREET, 0.1, '12345', '12345')
+    struct.add_node(',', PHRASE_POSTCODE, 0.1, 'xz', 'xz')
+    struct.add_node('>', PHRASE_POSTCODE, 0.1, '4444', '4444')
+
+    found = PostcodeParser(pc_config).parse(struct)
+    assert found == {(2, 3, '4444')}
+
+
+def test_partial_postcode_in_postcode_phrase(pc_config):
+    """No match is expected when the postcode phrase holds '2224 12345'."""
+    struct = QueryStruct([])
+    struct.nodes[-1].ptype = PHRASE_POSTCODE
+    struct.add_node(' ', PHRASE_POSTCODE, 0.1, '2224', '2224')
+    struct.add_node('>', PHRASE_POSTCODE, 0.1, '12345', '12345')
+
+    found = PostcodeParser(pc_config).parse(struct)
+    assert not found
diff --git a/test/python/api/search/test_query.py b/test/python/api/search/test_query.py
index c39094f0..09f25f8e 100644
--- a/test/python/api/search/test_query.py
+++ b/test/python/api/search/test_query.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test data types for search queries.
@@ -11,14 +11,15 @@ import pytest
 
 import nominatim_api.search.query as nq
 
+
 def test_token_range_equal():
     assert nq.TokenRange(2, 3) == nq.TokenRange(2, 3)
     assert not (nq.TokenRange(2, 3) != nq.TokenRange(2, 3))
 
 
 @pytest.mark.parametrize('lop,rop', [((1, 2), (3, 4)),
-                                    ((3, 4), (3, 5)),
-                                    ((10, 12), (11, 12))])
+                                     ((3, 4), (3, 5)),
+                                     ((10, 12), (11, 12))])
 def test_token_range_unequal(lop, rop):
     assert not (nq.TokenRange(*lop) == nq.TokenRange(*rop))
     assert nq.TokenRange(*lop) != nq.TokenRange(*rop)
@@ -28,17 +29,17 @@ def test_token_range_lt():
     assert nq.TokenRange(1, 3) < nq.TokenRange(10, 12)
     assert nq.TokenRange(5, 6) < nq.TokenRange(7, 8)
     assert nq.TokenRange(1, 4) < nq.TokenRange(4, 5)
-    assert not(nq.TokenRange(5, 6) < nq.TokenRange(5, 6))
-    assert not(nq.TokenRange(10, 11) < nq.TokenRange(4, 5))
+    assert not (nq.TokenRange(5, 6) < nq.TokenRange(5, 6))
+    assert not (nq.TokenRange(10, 11) < nq.TokenRange(4, 5))
 
 
 def test_token_rankge_gt():
     assert nq.TokenRange(3, 4) > nq.TokenRange(1, 2)
     assert nq.TokenRange(100, 200) > nq.TokenRange(10, 11)
     assert nq.TokenRange(10, 11) > nq.TokenRange(4, 10)
-    assert not(nq.TokenRange(5, 6) > nq.TokenRange(5, 6))
-    assert not(nq.TokenRange(1, 2) > nq.TokenRange(3, 4))
-    assert not(nq.TokenRange(4, 10) > nq.TokenRange(3, 5))
+    assert not (nq.TokenRange(5, 6) > nq.TokenRange(5, 6))
+    assert not (nq.TokenRange(1, 2) > nq.TokenRange(3, 4))
+    assert not (nq.TokenRange(4, 10) > nq.TokenRange(3, 5))
 
 
 def test_token_range_unimplemented_ops():
@@ -46,3 +47,19 @@ def test_token_range_unimplemented_ops():
         nq.TokenRange(1, 3) <= nq.TokenRange(10, 12)
     with pytest.raises(TypeError):
         nq.TokenRange(1, 3) >= nq.TokenRange(10, 12)
+
+
+def test_query_extract_words():
+    """Check the word combinations and token ranges returned by extract_words()."""
+    q = nq.QueryStruct([])
+    for btype, penalty, term in ((nq.BREAK_WORD, 0.1, '12'),
+                                 (nq.BREAK_TOKEN, 0.0, 'ab'),
+                                 (nq.BREAK_PHRASE, 0.0, '12'),
+                                 (nq.BREAK_END, 0.5, 'hallo')):
+        q.add_node(btype, nq.PHRASE_ANY, penalty, term, '')
+
+    words = q.extract_words(base_penalty=1.0)
+    assert set(words.keys()) == {'12', 'ab', 'hallo', '12 ab', 'ab 12', '12 ab 12'}
+    assert sorted(words['12']) == [nq.TokenRange(0, 1, 1.0), nq.TokenRange(2, 3, 1.0)]
+    assert words['12 ab'] == [nq.TokenRange(0, 2, 1.1)]
+    assert words['hallo'] == [nq.TokenRange(3, 4, 1.0)]
diff --git a/test/python/api/search/test_query_analyzer_factory.py b/test/python/api/search/test_query_analyzer_factory.py
index 42220b55..933bdd1f 100644
--- a/test/python/api/search/test_query_analyzer_factory.py
+++ b/test/python/api/search/test_query_analyzer_factory.py
@@ -2,18 +2,17 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for query analyzer creation.
 """
-from pathlib import Path
-
 import pytest
 
 from nominatim_api.search.query_analyzer_factory import make_query_analyzer
 from nominatim_api.search.icu_tokenizer import ICUQueryAnalyzer
 
+
 @pytest.mark.asyncio
 async def test_import_icu_tokenizer(table_factory, api):
     table_factory('nominatim_properties',
diff --git a/test/python/api/search/test_search_country.py b/test/python/api/search/test_search_country.py
index 2109ecb0..46875a2c 100644
--- a/test/python/api/search/test_search_country.py
+++ b/test/python/api/search/test_search_country.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the country searcher.
@@ -48,6 +48,7 @@ def test_find_from_placex(apiobj, frontend):
     assert results[0].place_id == 55
     assert results[0].accuracy == 0.8
 
+
 def test_find_from_fallback_countries(apiobj, frontend):
     apiobj.add_country('ro', 'POLYGON((0 0, 0 1, 1 1, 1 0, 0 0))')
     apiobj.add_country_name('ro', {'name': 'România'})
@@ -87,7 +88,6 @@ class TestCountryParameters:
         apiobj.add_country('ro', 'POLYGON((0 0, 0 1, 1 1, 1 0, 0 0))')
         apiobj.add_country_name('ro', {'name': 'România'})
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -100,7 +100,6 @@ class TestCountryParameters:
         assert len(results) == 1
         assert geom.name.lower() in results[0].geometry
 
-
     @pytest.mark.parametrize('pid,rids', [(76, [55]), (55, [])])
     def test_exclude_place_id(self, apiobj, frontend, pid, rids):
         results = run_search(apiobj, frontend, 0.5, ['yw', 'ro'],
@@ -108,7 +107,6 @@ class TestCountryParameters:
 
         assert [r.place_id for r in results] == rids
 
-
     @pytest.mark.parametrize('viewbox,rids', [((9, 9, 11, 11), [55]),
                                               ((-10, -10, -3, -3), [])])
     def test_bounded_viewbox_in_placex(self, apiobj, frontend, viewbox, rids):
@@ -118,9 +116,8 @@ class TestCountryParameters:
 
         assert [r.place_id for r in results] == rids
 
-
     @pytest.mark.parametrize('viewbox,numres', [((0, 0, 1, 1), 1),
-                                              ((-10, -10, -3, -3), 0)])
+                                                ((-10, -10, -3, -3), 0)])
     def test_bounded_viewbox_in_fallback(self, apiobj, frontend, viewbox, numres):
         results = run_search(apiobj, frontend, 0.5, ['ro'],
                              details=SearchDetails.from_kwargs({'viewbox': viewbox,
diff --git a/test/python/api/search/test_search_near.py b/test/python/api/search/test_search_near.py
index 43098ddd..e9650168 100644
--- a/test/python/api/search/test_search_near.py
+++ b/test/python/api/search/test_search_near.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the near searcher.
@@ -12,8 +12,8 @@ import pytest
 import nominatim_api as napi
 from nominatim_api.types import SearchDetails
 from nominatim_api.search.db_searches import NearSearch, PlaceSearch
-from nominatim_api.search.db_search_fields import WeightedStrings, WeightedCategories,\
-                                                  FieldLookup, FieldRanking, RankedTokens
+from nominatim_api.search.db_search_fields import WeightedStrings, WeightedCategories, \
+                                                  FieldLookup
 from nominatim_api.search.db_search_lookups import LookupAll
 
 
@@ -80,7 +80,6 @@ class TestNearSearch:
         apiobj.add_search_name(101, names=[56], country_code='mx',
                                centroid=(-10.3, 56.9))
 
-
     def test_near_in_placex(self, apiobj, frontend):
         apiobj.add_placex(place_id=22, class_='amenity', type='bank',
                           centroid=(5.6001, 4.2994))
@@ -91,7 +90,6 @@ class TestNearSearch:
 
         assert [r.place_id for r in results] == [22]
 
-
     def test_multiple_types_near_in_placex(self, apiobj, frontend):
         apiobj.add_placex(place_id=22, class_='amenity', type='bank',
                           importance=0.002,
@@ -105,7 +103,6 @@ class TestNearSearch:
 
         assert [r.place_id for r in results] == [22, 23]
 
-
     def test_near_in_classtype(self, apiobj, frontend):
         apiobj.add_placex(place_id=22, class_='amenity', type='bank',
                           centroid=(5.6, 4.34))
@@ -118,7 +115,6 @@ class TestNearSearch:
 
         assert [r.place_id for r in results] == [22]
 
-
     @pytest.mark.parametrize('cc,rid', [('us', 22), ('mx', 23)])
     def test_restrict_by_country(self, apiobj, frontend, cc, rid):
         apiobj.add_placex(place_id=22, class_='amenity', type='bank',
@@ -138,7 +134,6 @@ class TestNearSearch:
 
         assert [r.place_id for r in results] == [rid]
 
-
     @pytest.mark.parametrize('excluded,rid', [(22, 122), (122, 22)])
     def test_exclude_place_by_id(self, apiobj, frontend, excluded, rid):
         apiobj.add_placex(place_id=22, class_='amenity', type='bank',
@@ -148,13 +143,11 @@ class TestNearSearch:
                           centroid=(5.6001, 4.2994),
                           country_code='us')
 
-
         results = run_search(apiobj, frontend, 0.1, [('amenity', 'bank')],
                              details=SearchDetails(excluded=[excluded]))
 
         assert [r.place_id for r in results] == [rid]
 
-
     @pytest.mark.parametrize('layer,rids', [(napi.DataLayer.POI, [22]),
                                             (napi.DataLayer.MANMADE, [])])
     def test_with_layer(self, apiobj, frontend, layer, rids):
diff --git a/test/python/api/search/test_search_places.py b/test/python/api/search/test_search_places.py
index c6ff16b8..ed0722c3 100644
--- a/test/python/api/search/test_search_places.py
+++ b/test/python/api/search/test_search_places.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the generic place searcher.
@@ -14,12 +14,13 @@ import pytest
 import nominatim_api as napi
 from nominatim_api.types import SearchDetails
 from nominatim_api.search.db_searches import PlaceSearch
-from nominatim_api.search.db_search_fields import WeightedStrings, WeightedCategories,\
+from nominatim_api.search.db_search_fields import WeightedStrings, WeightedCategories, \
                                                   FieldLookup, FieldRanking, RankedTokens
 from nominatim_api.search.db_search_lookups import LookupAll, LookupAny, Restrict
 
 APIOPTIONS = ['search']
 
+
 def run_search(apiobj, frontend, global_penalty, lookup, ranking, count=2,
                hnrs=[], pcs=[], ccodes=[], quals=[],
                details=SearchDetails()):
@@ -55,29 +56,27 @@ class TestNameOnlySearches:
     def fill_database(self, apiobj):
         apiobj.add_placex(place_id=100, country_code='us',
                           centroid=(5.6, 4.3))
-        apiobj.add_search_name(100, names=[1,2,10,11], country_code='us',
+        apiobj.add_search_name(100, names=[1, 2, 10, 11], country_code='us',
                                centroid=(5.6, 4.3))
         apiobj.add_placex(place_id=101, country_code='mx',
                           centroid=(-10.3, 56.9))
-        apiobj.add_search_name(101, names=[1,2,20,21], country_code='mx',
+        apiobj.add_search_name(101, names=[1, 2, 20, 21], country_code='mx',
                                centroid=(-10.3, 56.9))
 
-
     @pytest.mark.parametrize('lookup_type', [LookupAll, Restrict])
     @pytest.mark.parametrize('rank,res', [([10], [100, 101]),
                                           ([20], [101, 100])])
     def test_lookup_all_match(self, apiobj, frontend, lookup_type, rank, res):
-        lookup = FieldLookup('name_vector', [1,2], lookup_type)
+        lookup = FieldLookup('name_vector', [1, 2], lookup_type)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, rank)])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking])
 
         assert [r.place_id for r in results] == res
 
-
     @pytest.mark.parametrize('lookup_type', [LookupAll, Restrict])
     def test_lookup_all_partial_match(self, apiobj, frontend, lookup_type):
-        lookup = FieldLookup('name_vector', [1,20], lookup_type)
+        lookup = FieldLookup('name_vector', [1, 20], lookup_type)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, [21])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking])
@@ -88,14 +87,13 @@ class TestNameOnlySearches:
     @pytest.mark.parametrize('rank,res', [([10], [100, 101]),
                                           ([20], [101, 100])])
     def test_lookup_any_match(self, apiobj, frontend, rank, res):
-        lookup = FieldLookup('name_vector', [11,21], LookupAny)
+        lookup = FieldLookup('name_vector', [11, 21], LookupAny)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, rank)])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking])
 
         assert [r.place_id for r in results] == res
 
-
     def test_lookup_any_partial_match(self, apiobj, frontend):
         lookup = FieldLookup('name_vector', [20], LookupAll)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, [21])])
@@ -105,19 +103,17 @@ class TestNameOnlySearches:
         assert len(results) == 1
         assert results[0].place_id == 101
 
-
     @pytest.mark.parametrize('cc,res', [('us', 100), ('mx', 101)])
     def test_lookup_restrict_country(self, apiobj, frontend, cc, res):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], ccodes=[cc])
 
         assert [r.place_id for r in results] == [res]
 
-
     def test_lookup_restrict_placeid(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking],
@@ -125,7 +121,6 @@ class TestNameOnlySearches:
 
         assert [r.place_id for r in results] == [100]
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -139,7 +134,6 @@ class TestNameOnlySearches:
 
         assert geom.name.lower() in results[0].geometry
 
-
     @pytest.mark.parametrize('factor,npoints', [(0.0, 3), (1.0, 2)])
     def test_return_simplified_geometry(self, apiobj, frontend, factor, npoints):
         apiobj.add_placex(place_id=333, country_code='us',
@@ -162,7 +156,6 @@ class TestNameOnlySearches:
         assert result.place_id == 333
         assert len(geom['coordinates']) == npoints
 
-
     @pytest.mark.parametrize('viewbox', ['5.0,4.0,6.0,5.0', '5.7,4.0,6.0,5.0'])
     @pytest.mark.parametrize('wcount,rids', [(2, [100, 101]), (20000, [100])])
     def test_prefer_viewbox(self, apiobj, frontend, viewbox, wcount, rids):
@@ -177,18 +170,16 @@ class TestNameOnlySearches:
                              details=SearchDetails.from_kwargs({'viewbox': viewbox}))
         assert [r.place_id for r in results] == rids
 
-
     @pytest.mark.parametrize('viewbox', ['5.0,4.0,6.0,5.0', '5.55,4.27,5.62,4.31'])
     def test_force_viewbox(self, apiobj, frontend, viewbox):
         lookup = FieldLookup('name_vector', [1, 2], LookupAll)
 
-        details=SearchDetails.from_kwargs({'viewbox': viewbox,
-                                           'bounded_viewbox': True})
+        details = SearchDetails.from_kwargs({'viewbox': viewbox,
+                                             'bounded_viewbox': True})
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [], details=details)
         assert [r.place_id for r in results] == [100]
 
-
     def test_prefer_near(self, apiobj, frontend):
         lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.4, [RankedTokens(0.0, [21])])
@@ -202,13 +193,12 @@ class TestNameOnlySearches:
         results.sort(key=lambda r: -r.importance)
         assert [r.place_id for r in results] == [100, 101]
 
-
     @pytest.mark.parametrize('radius', [0.09, 0.11])
     def test_force_near(self, apiobj, frontend, radius):
         lookup = FieldLookup('name_vector', [1, 2], LookupAll)
 
-        details=SearchDetails.from_kwargs({'near': '5.6,4.3',
-                                           'near_radius': radius})
+        details = SearchDetails.from_kwargs({'near': '5.6,4.3',
+                                             'near_radius': radius})
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [], details=details)
 
@@ -228,7 +218,7 @@ class TestStreetWithHousenumber:
         apiobj.add_placex(place_id=1000, class_='highway', type='residential',
                           rank_search=26, rank_address=26,
                           country_code='es')
-        apiobj.add_search_name(1000, names=[1,2,10,11],
+        apiobj.add_search_name(1000, names=[1, 2, 10, 11],
                                search_rank=26, address_rank=26,
                                country_code='es')
         apiobj.add_placex(place_id=91, class_='place', type='house',
@@ -243,26 +233,24 @@ class TestStreetWithHousenumber:
         apiobj.add_placex(place_id=2000, class_='highway', type='residential',
                           rank_search=26, rank_address=26,
                           country_code='pt')
-        apiobj.add_search_name(2000, names=[1,2,20,21],
+        apiobj.add_search_name(2000, names=[1, 2, 20, 21],
                                search_rank=26, address_rank=26,
                                country_code='pt')
 
-
     @pytest.mark.parametrize('hnr,res', [('20', [91, 1]), ('20 a', [1]),
                                          ('21', [2]), ('22', [2, 92]),
                                          ('24', [93]), ('25', [])])
     def test_lookup_by_single_housenumber(self, apiobj, frontend, hnr, res):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=[hnr])
 
         assert [r.place_id for r in results] == res + [1000, 2000]
 
-
     @pytest.mark.parametrize('cc,res', [('es', [2, 1000]), ('pt', [92, 2000])])
     def test_lookup_with_country_restriction(self, apiobj, frontend, cc, res):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -270,9 +258,8 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == res
 
-
     def test_lookup_exclude_housenumber_placeid(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -280,9 +267,8 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == [2, 1000, 2000]
 
-
     def test_lookup_exclude_street_placeid(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -290,9 +276,8 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == [2, 92, 2000]
 
-
     def test_lookup_only_house_qualifier(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -300,9 +285,8 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == [2, 92]
 
-
     def test_lookup_only_street_qualifier(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -310,10 +294,9 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == [1000, 2000]
 
-
     @pytest.mark.parametrize('rank,found', [(26, True), (27, False), (30, False)])
     def test_lookup_min_rank(self, apiobj, frontend, rank, found):
-        lookup = FieldLookup('name_vector', [1,2], LookupAll)
+        lookup = FieldLookup('name_vector', [1, 2], LookupAll)
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, [lookup], [ranking], hnrs=['22'],
@@ -321,7 +304,6 @@ class TestStreetWithHousenumber:
 
         assert [r.place_id for r in results] == ([2, 92, 1000, 2000] if found else [2, 92])
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -343,7 +325,7 @@ def test_very_large_housenumber(apiobj, frontend):
     apiobj.add_placex(place_id=2000, class_='highway', type='residential',
                       rank_search=26, rank_address=26,
                       country_code='pt')
-    apiobj.add_search_name(2000, names=[1,2],
+    apiobj.add_search_name(2000, names=[1, 2],
                            search_rank=26, address_rank=26,
                            country_code='pt')
 
@@ -405,7 +387,6 @@ class TestInterpolations:
                            centroid=(10.0, 10.00001),
                            geometry='LINESTRING(9.995 10.00001, 10.005 10.00001)')
 
-
     @pytest.mark.parametrize('hnr,res', [('21', [992]), ('22', []), ('23', [991])])
     def test_lookup_housenumber(self, apiobj, frontend, hnr, res):
         lookup = FieldLookup('name_vector', [111], LookupAll)
@@ -414,7 +395,6 @@ class TestInterpolations:
 
         assert [r.place_id for r in results] == res + [990]
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -429,7 +409,6 @@ class TestInterpolations:
         assert geom.name.lower() in results[0].geometry
 
 
-
 class TestTiger:
 
     @pytest.fixture(autouse=True)
@@ -453,7 +432,6 @@ class TestTiger:
                          centroid=(10.0, 10.00001),
                          geometry='LINESTRING(9.995 10.00001, 10.005 10.00001)')
 
-
     @pytest.mark.parametrize('hnr,res', [('21', [992]), ('22', []), ('23', [991])])
     def test_lookup_housenumber(self, apiobj, frontend, hnr, res):
         lookup = FieldLookup('name_vector', [111], LookupAll)
@@ -462,7 +440,6 @@ class TestTiger:
 
         assert [r.place_id for r in results] == res + [990]
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -513,15 +490,15 @@ class TestLayersRank30:
                                importance=0.0005,
                                address_rank=0, search_rank=30)
 
-
-    @pytest.mark.parametrize('layer,res', [(napi.DataLayer.ADDRESS, [223]),
-                                           (napi.DataLayer.POI, [224]),
-                                           (napi.DataLayer.ADDRESS | napi.DataLayer.POI, [223, 224]),
-                                           (napi.DataLayer.MANMADE, [225]),
-                                           (napi.DataLayer.RAILWAY, [226]),
-                                           (napi.DataLayer.NATURAL, [227]),
-                                           (napi.DataLayer.MANMADE | napi.DataLayer.NATURAL, [225, 227]),
-                                           (napi.DataLayer.MANMADE | napi.DataLayer.RAILWAY, [225, 226])])
+    @pytest.mark.parametrize('layer,res',
+                             [(napi.DataLayer.ADDRESS, [223]),
+                              (napi.DataLayer.POI, [224]),
+                              (napi.DataLayer.ADDRESS | napi.DataLayer.POI, [223, 224]),
+                              (napi.DataLayer.MANMADE, [225]),
+                              (napi.DataLayer.RAILWAY, [226]),
+                              (napi.DataLayer.NATURAL, [227]),
+                              (napi.DataLayer.MANMADE | napi.DataLayer.NATURAL, [225, 227]),
+                              (napi.DataLayer.MANMADE | napi.DataLayer.RAILWAY, [225, 226])])
     def test_layers_rank30(self, apiobj, frontend, layer, res):
         lookup = FieldLookup('name_vector', [34], LookupAny)
 
diff --git a/test/python/api/search/test_search_poi.py b/test/python/api/search/test_search_poi.py
index d4319a57..9387385e 100644
--- a/test/python/api/search/test_search_poi.py
+++ b/test/python/api/search/test_search_poi.py
@@ -2,14 +2,13 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the POI searcher.
 """
 import pytest
 
-import nominatim_api as napi
 from nominatim_api.types import SearchDetails
 from nominatim_api.search.db_searches import PoiSearch
 from nominatim_api.search.db_search_fields import WeightedStrings, WeightedCategories
@@ -84,14 +83,12 @@ class TestPoiSearchWithRestrictions:
         else:
             self.args = {'near': '34.3, 56.100021', 'near_radius': 0.001}
 
-
     def test_unrestricted(self, apiobj, frontend):
         results = run_search(apiobj, frontend, 0.1, [('highway', 'bus_stop')], [0.5],
                              details=SearchDetails.from_kwargs(self.args))
 
         assert [r.place_id for r in results] == [1, 2]
 
-
     def test_restict_country(self, apiobj, frontend):
         results = run_search(apiobj, frontend, 0.1, [('highway', 'bus_stop')], [0.5],
                              ccodes=['de', 'nz'],
@@ -99,7 +96,6 @@ class TestPoiSearchWithRestrictions:
 
         assert [r.place_id for r in results] == [2]
 
-
     def test_restrict_by_viewbox(self, apiobj, frontend):
         args = {'bounded_viewbox': True, 'viewbox': '34.299,56.0,34.3001,56.10001'}
         args.update(self.args)
diff --git a/test/python/api/search/test_search_postcode.py b/test/python/api/search/test_search_postcode.py
index 369e1504..529fb409 100644
--- a/test/python/api/search/test_search_postcode.py
+++ b/test/python/api/search/test_search_postcode.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the postcode searcher.
@@ -15,6 +15,7 @@ from nominatim_api.search.db_searches import PostcodeSearch
 from nominatim_api.search.db_search_fields import WeightedStrings, FieldLookup, \
                                                   FieldRanking, RankedTokens
 
+
 def run_search(apiobj, frontend, global_penalty, pcs, pc_penalties=None,
                ccodes=[], lookup=[], ranking=[], details=SearchDetails()):
     if pc_penalties is None:
@@ -85,26 +86,24 @@ class TestPostcodeSearchWithAddress:
         apiobj.add_placex(place_id=1000, class_='place', type='village',
                           rank_search=22, rank_address=22,
                           country_code='ch')
-        apiobj.add_search_name(1000, names=[1,2,10,11],
+        apiobj.add_search_name(1000, names=[1, 2, 10, 11],
                                search_rank=22, address_rank=22,
                                country_code='ch')
         apiobj.add_placex(place_id=2000, class_='place', type='village',
                           rank_search=22, rank_address=22,
                           country_code='pl')
-        apiobj.add_search_name(2000, names=[1,2,20,21],
+        apiobj.add_search_name(2000, names=[1, 2, 20, 21],
                                search_rank=22, address_rank=22,
                                country_code='pl')
 
-
     def test_lookup_both(self, apiobj, frontend):
-        lookup = FieldLookup('name_vector', [1,2], 'restrict')
+        lookup = FieldLookup('name_vector', [1, 2], 'restrict')
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, ['12345'], lookup=[lookup], ranking=[ranking])
 
         assert [r.place_id for r in results] == [100, 101]
 
-
     def test_restrict_by_name(self, apiobj, frontend):
         lookup = FieldLookup('name_vector', [10], 'restrict')
 
@@ -112,11 +111,10 @@ class TestPostcodeSearchWithAddress:
 
         assert [r.place_id for r in results] == [100]
 
-
     @pytest.mark.parametrize('coord,place_id', [((16.5, 5), 100),
                                                 ((-45.1, 7.004), 101)])
     def test_lookup_near(self, apiobj, frontend, coord, place_id):
-        lookup = FieldLookup('name_vector', [1,2], 'restrict')
+        lookup = FieldLookup('name_vector', [1, 2], 'restrict')
         ranking = FieldRanking('name_vector', 0.3, [RankedTokens(0.0, [10])])
 
         results = run_search(apiobj, frontend, 0.1, ['12345'],
@@ -126,7 +124,6 @@ class TestPostcodeSearchWithAddress:
 
         assert [r.place_id for r in results] == [place_id]
 
-
     @pytest.mark.parametrize('geom', [napi.GeometryFormat.GEOJSON,
                                       napi.GeometryFormat.KML,
                                       napi.GeometryFormat.SVG,
@@ -138,18 +135,16 @@ class TestPostcodeSearchWithAddress:
         assert results
         assert all(geom.name.lower() in r.geometry for r in results)
 
-
-    @pytest.mark.parametrize('viewbox, rids', [('-46,6,-44,8', [101,100]),
-                                               ('16,4,18,6', [100,101])])
+    @pytest.mark.parametrize('viewbox, rids', [('-46,6,-44,8', [101, 100]),
+                                               ('16,4,18,6', [100, 101])])
     def test_prefer_viewbox(self, apiobj, frontend, viewbox, rids):
         results = run_search(apiobj, frontend, 0.1, ['12345'],
                              details=SearchDetails.from_kwargs({'viewbox': viewbox}))
 
         assert [r.place_id for r in results] == rids
 
-
     @pytest.mark.parametrize('viewbox, rid', [('-46,6,-44,8', 101),
-                                               ('16,4,18,6', 100)])
+                                              ('16,4,18,6', 100)])
     def test_restrict_to_viewbox(self, apiobj, frontend, viewbox, rid):
         results = run_search(apiobj, frontend, 0.1, ['12345'],
                              details=SearchDetails.from_kwargs({'viewbox': viewbox,
@@ -157,7 +152,6 @@ class TestPostcodeSearchWithAddress:
 
         assert [r.place_id for r in results] == [rid]
 
-
     @pytest.mark.parametrize('coord,rids', [((17.05, 5), [100, 101]),
                                             ((-45, 7.1), [101, 100])])
     def test_prefer_near(self, apiobj, frontend, coord, rids):
@@ -166,7 +160,6 @@ class TestPostcodeSearchWithAddress:
 
         assert [r.place_id for r in results] == rids
 
-
     @pytest.mark.parametrize('pid,rid', [(100, 101), (101, 100)])
     def test_exclude(self, apiobj, frontend, pid, rid):
         results = run_search(apiobj, frontend, 0.1, ['12345'],
diff --git a/test/python/api/search/test_token_assignment.py b/test/python/api/search/test_token_assignment.py
index 0d89ed5f..2ffba335 100644
--- a/test/python/api/search/test_token_assignment.py
+++ b/test/python/api/search/test_token_assignment.py
@@ -2,15 +2,19 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for creation of token assignments from tokenized queries.
 """
 import pytest
 
-from nominatim_api.search.query import QueryStruct, Phrase, PhraseType, BreakType, TokenType, TokenRange, Token
-from nominatim_api.search.token_assignment import yield_token_assignments, TokenAssignment, PENALTY_TOKENCHANGE
+from nominatim_api.search.query import QueryStruct, Phrase, TokenRange, Token
+import nominatim_api.search.query as qmod
+from nominatim_api.search.token_assignment import (yield_token_assignments,
+                                                   TokenAssignment,
+                                                   PENALTY_TOKENCHANGE)
+
 
 class MyToken(Token):
     def get_category(self):
@@ -24,7 +28,7 @@ def make_query(*args):
 
     for btype, ptype, _ in args[1:]:
         q.add_node(btype, ptype)
-    q.add_node(BreakType.END, PhraseType.NONE)
+    q.add_node(qmod.BREAK_END, qmod.PHRASE_ANY)
 
     for start, t in enumerate(args):
         for end, ttype in t[2]:
@@ -43,52 +47,52 @@ def check_assignments(actual, *expected):
 
 
 def test_query_with_missing_tokens():
-    q = QueryStruct([Phrase(PhraseType.NONE, '')])
-    q.add_node(BreakType.END, PhraseType.NONE)
+    q = QueryStruct([Phrase(qmod.PHRASE_ANY, '')])
+    q.add_node(qmod.BREAK_END, qmod.PHRASE_ANY)
 
     assert list(yield_token_assignments(q)) == []
 
 
 def test_one_word_query():
-    q = make_query((BreakType.START, PhraseType.NONE,
-                    [(1, TokenType.PARTIAL),
-                     (1, TokenType.WORD),
-                     (1, TokenType.HOUSENUMBER)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY,
+                    [(1, qmod.TOKEN_PARTIAL),
+                     (1, qmod.TOKEN_WORD),
+                     (1, qmod.TOKEN_HOUSENUMBER)]))
 
     res = list(yield_token_assignments(q))
     assert res == [TokenAssignment(name=TokenRange(0, 1))]
 
 
 def test_single_postcode():
-    q = make_query((BreakType.START, PhraseType.NONE,
-                    [(1, TokenType.POSTCODE)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY,
+                    [(1, qmod.TOKEN_POSTCODE)]))
 
     res = list(yield_token_assignments(q))
     assert res == [TokenAssignment(postcode=TokenRange(0, 1))]
 
 
 def test_single_country_name():
-    q = make_query((BreakType.START, PhraseType.NONE,
-                    [(1, TokenType.COUNTRY)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY,
+                    [(1, qmod.TOKEN_COUNTRY)]))
 
     res = list(yield_token_assignments(q))
     assert res == [TokenAssignment(country=TokenRange(0, 1))]
 
 
 def test_single_word_poi_search():
-    q = make_query((BreakType.START, PhraseType.NONE,
-                    [(1, TokenType.NEAR_ITEM),
-                     (1, TokenType.QUALIFIER)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY,
+                    [(1, qmod.TOKEN_NEAR_ITEM),
+                     (1, qmod.TOKEN_QUALIFIER)]))
 
     res = list(yield_token_assignments(q))
     assert res == [TokenAssignment(near_item=TokenRange(0, 1))]
 
 
-@pytest.mark.parametrize('btype', [BreakType.WORD, BreakType.PART, BreakType.TOKEN])
+@pytest.mark.parametrize('btype', [qmod.BREAK_WORD, qmod.BREAK_PART, qmod.BREAK_TOKEN])
 def test_multiple_simple_words(btype):
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (btype, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (btype, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (btype, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (btype, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     penalty = PENALTY_TOKENCHANGE[btype]
 
@@ -101,13 +105,12 @@ def test_multiple_simple_words(btype):
                       TokenAssignment(penalty=penalty, name=TokenRange(1, 3),
                                       address=[TokenRange(0, 1)]),
                       TokenAssignment(penalty=penalty, name=TokenRange(2, 3),
-                                      address=[TokenRange(0, 2)])
-                     )
+                                      address=[TokenRange(0, 2)]))
 
 
 def test_multiple_words_respect_phrase_break():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(name=TokenRange(0, 1),
@@ -117,8 +120,8 @@ def test_multiple_words_respect_phrase_break():
 
 
 def test_housenumber_and_street():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.HOUSENUMBER)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(name=TokenRange(1, 2),
@@ -128,8 +131,8 @@ def test_housenumber_and_street():
 
 
 def test_housenumber_and_street_backwards():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.HOUSENUMBER)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_HOUSENUMBER)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(name=TokenRange(0, 1),
@@ -139,10 +142,10 @@ def test_housenumber_and_street_backwards():
 
 
 def test_housenumber_and_postcode():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(4, TokenType.POSTCODE)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(4, qmod.TOKEN_POSTCODE)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=pytest.approx(0.3),
@@ -155,11 +158,12 @@ def test_housenumber_and_postcode():
                                       address=[TokenRange(0, 1), TokenRange(2, 3)],
                                       postcode=TokenRange(3, 4)))
 
+
 def test_postcode_and_housenumber():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.POSTCODE)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(4, TokenType.HOUSENUMBER)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_POSTCODE)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(4, qmod.TOKEN_HOUSENUMBER)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=pytest.approx(0.3),
@@ -174,54 +178,54 @@ def test_postcode_and_housenumber():
 
 
 def test_country_housenumber_postcode():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.COUNTRY)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(4, TokenType.POSTCODE)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_COUNTRY)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(4, qmod.TOKEN_POSTCODE)]))
 
     check_assignments(yield_token_assignments(q))
 
 
-@pytest.mark.parametrize('ttype', [TokenType.POSTCODE, TokenType.COUNTRY,
-                                   TokenType.NEAR_ITEM, TokenType.QUALIFIER])
+@pytest.mark.parametrize('ttype', [qmod.TOKEN_POSTCODE, qmod.TOKEN_COUNTRY,
+                                   qmod.TOKEN_NEAR_ITEM, qmod.TOKEN_QUALIFIER])
 def test_housenumber_with_only_special_terms(ttype):
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, ttype)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, ttype)]))
 
     check_assignments(yield_token_assignments(q))
 
 
-@pytest.mark.parametrize('ttype', [TokenType.POSTCODE, TokenType.HOUSENUMBER, TokenType.COUNTRY])
+@pytest.mark.parametrize('ttype', [qmod.TOKEN_POSTCODE, qmod.TOKEN_HOUSENUMBER, qmod.TOKEN_COUNTRY])
 def test_multiple_special_tokens(ttype):
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, ttype)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(3, ttype)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, ttype)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(3, ttype)]))
 
     check_assignments(yield_token_assignments(q))
 
 
 def test_housenumber_many_phrases():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(3, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(4, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(5, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(4, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(5, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1,
                                       name=TokenRange(4, 5),
-                                      housenumber=TokenRange(3, 4),\
+                                      housenumber=TokenRange(3, 4),
                                       address=[TokenRange(0, 1), TokenRange(1, 2),
                                                TokenRange(2, 3)]),
                       TokenAssignment(penalty=0.1,
-                                      housenumber=TokenRange(3, 4),\
+                                      housenumber=TokenRange(3, 4),
                                       address=[TokenRange(0, 1), TokenRange(1, 2),
                                                TokenRange(2, 3), TokenRange(4, 5)]))
 
 
 def test_country_at_beginning():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.COUNTRY)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_COUNTRY)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(1, 2),
@@ -229,8 +233,8 @@ def test_country_at_beginning():
 
 
 def test_country_at_end():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.COUNTRY)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_COUNTRY)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(0, 1),
@@ -238,16 +242,16 @@ def test_country_at_end():
 
 
 def test_country_in_middle():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.COUNTRY)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_COUNTRY)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q))
 
 
 def test_postcode_with_designation():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.POSTCODE)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_POSTCODE)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(1, 2),
@@ -257,8 +261,8 @@ def test_postcode_with_designation():
 
 
 def test_postcode_with_designation_backwards():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.POSTCODE)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_POSTCODE)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(name=TokenRange(0, 1),
@@ -268,8 +272,8 @@ def test_postcode_with_designation_backwards():
 
 
 def test_near_item_at_beginning():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.NEAR_ITEM)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_NEAR_ITEM)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(1, 2),
@@ -277,8 +281,8 @@ def test_near_item_at_beginning():
 
 
 def test_near_item_at_end():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.NEAR_ITEM)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_NEAR_ITEM)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(0, 1),
@@ -286,18 +290,17 @@ def test_near_item_at_end():
 
 
 def test_near_item_in_middle():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.NEAR_ITEM)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_NEAR_ITEM)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q))
 
 
 def test_qualifier_at_beginning():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.QUALIFIER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
-
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_QUALIFIER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.1, name=TokenRange(1, 3),
@@ -308,12 +311,11 @@ def test_qualifier_at_beginning():
 
 
 def test_qualifier_after_name():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.QUALIFIER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(4, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(5, TokenType.PARTIAL)]))
-
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_QUALIFIER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(4, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(5, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q),
                       TokenAssignment(penalty=0.2, name=TokenRange(0, 2),
@@ -325,27 +327,26 @@ def test_qualifier_after_name():
 
 
 def test_qualifier_before_housenumber():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.QUALIFIER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_QUALIFIER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q))
 
 
 def test_qualifier_after_housenumber():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.HOUSENUMBER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(2, TokenType.QUALIFIER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_HOUSENUMBER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(2, qmod.TOKEN_QUALIFIER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q))
 
 
 def test_qualifier_in_middle_of_phrase():
-    q = make_query((BreakType.START, PhraseType.NONE, [(1, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(2, TokenType.PARTIAL)]),
-                   (BreakType.WORD, PhraseType.NONE, [(3, TokenType.QUALIFIER)]),
-                   (BreakType.WORD, PhraseType.NONE, [(4, TokenType.PARTIAL)]),
-                   (BreakType.PHRASE, PhraseType.NONE, [(5, TokenType.PARTIAL)]))
+    q = make_query((qmod.BREAK_START, qmod.PHRASE_ANY, [(1, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(2, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(3, qmod.TOKEN_QUALIFIER)]),
+                   (qmod.BREAK_WORD, qmod.PHRASE_ANY, [(4, qmod.TOKEN_PARTIAL)]),
+                   (qmod.BREAK_PHRASE, qmod.PHRASE_ANY, [(5, qmod.TOKEN_PARTIAL)]))
 
     check_assignments(yield_token_assignments(q))
-
diff --git a/test/python/api/test_api_connection.py b/test/python/api/test_api_connection.py
index f62b0d9e..9b29411a 100644
--- a/test/python/api/test_api_connection.py
+++ b/test/python/api/test_api_connection.py
@@ -2,12 +2,11 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for enhanced connection class for API functions.
 """
-from pathlib import Path
 import pytest
 
 import sqlalchemy as sa
@@ -76,7 +75,7 @@ async def test_get_db_property_existing(api):
 
 
 @pytest.mark.asyncio
-async def test_get_db_property_existing(api):
+async def test_get_db_property_bad_name(api):
     async with api.begin() as conn:
         with pytest.raises(ValueError):
             await conn.get_db_property('dfkgjd.rijg')
diff --git a/test/python/api/test_api_deletable_v1.py b/test/python/api/test_api_deletable_v1.py
index 9e113886..8ea4c9cd 100644
--- a/test/python/api/test_api_deletable_v1.py
+++ b/test/python/api/test_api_deletable_v1.py
@@ -2,20 +2,20 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the deletable v1 API call.
 """
 import json
-from pathlib import Path
 
 import pytest
 
-from fake_adaptor import FakeAdaptor, FakeError, FakeResponse
+from fake_adaptor import FakeAdaptor
 
 import nominatim_api.v1.server_glue as glue
 
+
 class TestDeletableEndPoint:
 
     @pytest.fixture(autouse=True)
@@ -25,14 +25,13 @@ class TestDeletableEndPoint:
                       content=[(345, 'N', 'boundary', 'administrative'),
                                (781, 'R', 'landuse', 'wood'),
                                (781, 'R', 'landcover', 'grass')])
-        table_factory('placex',
-                      definition="""place_id bigint, osm_id bigint, osm_type char(1),
-                                    class text, type text, name HSTORE, country_code char(2)""",
-                      content=[(1, 345, 'N', 'boundary', 'administrative', {'old_name': 'Former'}, 'ab'),
-                               (2, 781, 'R', 'landuse', 'wood', {'name': 'Wood'}, 'cd'),
-                               (3, 781, 'R', 'landcover', 'grass', None, 'cd')])
-
-
+        table_factory(
+            'placex',
+            definition="""place_id bigint, osm_id bigint, osm_type char(1),
+                          class text, type text, name HSTORE, country_code char(2)""",
+            content=[(1, 345, 'N', 'boundary', 'administrative', {'old_name': 'Former'}, 'ab'),
+                     (2, 781, 'R', 'landuse', 'wood', {'name': 'Wood'}, 'cd'),
+                     (3, 781, 'R', 'landcover', 'grass', None, 'cd')])
 
     @pytest.mark.asyncio
     async def test_deletable(self, api):
diff --git a/test/python/api/test_api_details.py b/test/python/api/test_api_details.py
index 7f405728..4f6dd92b 100644
--- a/test/python/api/test_api_details.py
+++ b/test/python/api/test_api_details.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for details API call.
@@ -13,23 +13,24 @@ import pytest
 
 import nominatim_api as napi
 
+
 @pytest.mark.parametrize('idobj', (napi.PlaceID(332), napi.OsmID('W', 4),
                                    napi.OsmID('W', 4, 'highway')))
 def test_lookup_in_placex(apiobj, frontend, idobj):
     import_date = dt.datetime(2022, 12, 7, 14, 14, 46, 0)
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     name={'name': 'Road'}, address={'city': 'Barrow'},
-                     extratags={'surface': 'paved'},
-                     parent_place_id=34, linked_place_id=55,
-                     admin_level=15, country_code='gb',
-                     housenumber='4',
-                     postcode='34425', wikipedia='en:Faa',
-                     rank_search=27, rank_address=26,
-                     importance=0.01,
-                     centroid=(23, 34),
-                     indexed_date=import_date,
-                     geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
+                      class_='highway', type='residential',
+                      name={'name': 'Road'}, address={'city': 'Barrow'},
+                      extratags={'surface': 'paved'},
+                      parent_place_id=34, linked_place_id=55,
+                      admin_level=15, country_code='gb',
+                      housenumber='4',
+                      postcode='34425', wikipedia='en:Faa',
+                      rank_search=27, rank_address=26,
+                      importance=0.01,
+                      centroid=(23, 34),
+                      indexed_date=import_date,
+                      geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
 
     api = frontend(apiobj, options={'details'})
     result = api.details(idobj)
@@ -73,12 +74,12 @@ def test_lookup_in_placex(apiobj, frontend, idobj):
 def test_lookup_in_placex_minimal_info(apiobj, frontend):
     import_date = dt.datetime(2022, 12, 7, 14, 14, 46, 0)
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     admin_level=15,
-                     rank_search=27, rank_address=26,
-                     centroid=(23, 34),
-                     indexed_date=import_date,
-                     geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
+                      class_='highway', type='residential',
+                      admin_level=15,
+                      rank_search=27, rank_address=26,
+                      centroid=(23, 34),
+                      indexed_date=import_date,
+                      geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
 
     api = frontend(apiobj, options={'details'})
     result = api.details(napi.PlaceID(332))
@@ -131,9 +132,9 @@ def test_lookup_in_placex_with_geometry(apiobj, frontend):
 
 def test_lookup_placex_with_address_details(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl',
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl',
+                      rank_search=27, rank_address=26)
     apiobj.add_address_placex(332, fromarea=False, isaddress=False,
                               distance=0.0034,
                               place_id=1000, osm_type='N', osm_id=3333,
@@ -178,9 +179,9 @@ def test_lookup_placex_with_address_details(apiobj, frontend):
 
 def test_lookup_place_with_linked_places_none_existing(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', linked_place_id=45,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', linked_place_id=45,
+                      rank_search=27, rank_address=26)
 
     api = frontend(apiobj, options={'details'})
     result = api.details(napi.PlaceID(332), linked_places=True)
@@ -190,17 +191,17 @@ def test_lookup_place_with_linked_places_none_existing(apiobj, frontend):
 
 def test_lookup_place_with_linked_places_existing(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', linked_place_id=45,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', linked_place_id=45,
+                      rank_search=27, rank_address=26)
     apiobj.add_placex(place_id=1001, osm_type='W', osm_id=5,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', linked_place_id=332,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', linked_place_id=332,
+                      rank_search=27, rank_address=26)
     apiobj.add_placex(place_id=1002, osm_type='W', osm_id=6,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', linked_place_id=332,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', linked_place_id=332,
+                      rank_search=27, rank_address=26)
 
     api = frontend(apiobj, options={'details'})
     result = api.details(napi.PlaceID(332), linked_places=True)
@@ -221,9 +222,9 @@ def test_lookup_place_with_linked_places_existing(apiobj, frontend):
 
 def test_lookup_place_with_parented_places_not_existing(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', parent_place_id=45,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', parent_place_id=45,
+                      rank_search=27, rank_address=26)
 
     api = frontend(apiobj, options={'details'})
     result = api.details(napi.PlaceID(332), parented_places=True)
@@ -233,17 +234,17 @@ def test_lookup_place_with_parented_places_not_existing(apiobj, frontend):
 
 def test_lookup_place_with_parented_places_existing(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', parent_place_id=45,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', parent_place_id=45,
+                      rank_search=27, rank_address=26)
     apiobj.add_placex(place_id=1001, osm_type='N', osm_id=5,
-                     class_='place', type='house', housenumber='23',
-                     country_code='pl', parent_place_id=332,
-                     rank_search=30, rank_address=30)
+                      class_='place', type='house', housenumber='23',
+                      country_code='pl', parent_place_id=332,
+                      rank_search=30, rank_address=30)
     apiobj.add_placex(place_id=1002, osm_type='W', osm_id=6,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', parent_place_id=332,
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', parent_place_id=332,
+                      rank_search=27, rank_address=26)
 
     api = frontend(apiobj, options={'details'})
     result = api.details(napi.PlaceID(332), parented_places=True)
@@ -332,9 +333,9 @@ def test_lookup_osmline_with_address_details(apiobj, frontend):
                        startnumber=2, endnumber=4, step=1,
                        parent_place_id=332)
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl',
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl',
+                      rank_search=27, rank_address=26)
     apiobj.add_address_placex(332, fromarea=False, isaddress=False,
                               distance=0.0034,
                               place_id=1000, osm_type='N', osm_id=3333,
@@ -432,9 +433,9 @@ def test_lookup_tiger_with_address_details(apiobj, frontend):
                      startnumber=2, endnumber=4, step=1,
                      parent_place_id=332)
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='us',
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='us',
+                      rank_search=27, rank_address=26)
     apiobj.add_address_placex(332, fromarea=False, isaddress=False,
                               distance=0.0034,
                               place_id=1000, osm_type='N', osm_id=3333,
@@ -571,6 +572,7 @@ def test_lookup_postcode_with_address_details(apiobj, frontend):
                                 rank_address=4, distance=0.0)
            ]
 
+
 @pytest.mark.parametrize('objid', [napi.PlaceID(1736),
                                    napi.OsmID('W', 55),
                                    napi.OsmID('N', 55, 'amenity')])
@@ -583,8 +585,8 @@ def test_lookup_missing_object(apiobj, frontend, objid):
 
 
 @pytest.mark.parametrize('gtype', (napi.GeometryFormat.KML,
-                                    napi.GeometryFormat.SVG,
-                                    napi.GeometryFormat.TEXT))
+                                   napi.GeometryFormat.SVG,
+                                   napi.GeometryFormat.TEXT))
 def test_lookup_unsupported_geometry(apiobj, frontend, gtype):
     apiobj.add_placex(place_id=332)
 
diff --git a/test/python/api/test_api_lookup.py b/test/python/api/test_api_lookup.py
index 4281cd6c..a2660f51 100644
--- a/test/python/api/test_api_lookup.py
+++ b/test/python/api/test_api_lookup.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for lookup API call.
@@ -13,6 +13,7 @@ import pytest
 
 import nominatim_api as napi
 
+
 def test_lookup_empty_list(apiobj, frontend):
     api = frontend(apiobj, options={'details'})
     assert api.lookup([]) == []
@@ -28,17 +29,17 @@ def test_lookup_non_existing(apiobj, frontend):
                                    napi.OsmID('W', 4, 'highway')))
 def test_lookup_single_placex(apiobj, frontend, idobj):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     name={'name': 'Road'}, address={'city': 'Barrow'},
-                     extratags={'surface': 'paved'},
-                     parent_place_id=34, linked_place_id=55,
-                     admin_level=15, country_code='gb',
-                     housenumber='4',
-                     postcode='34425', wikipedia='en:Faa',
-                     rank_search=27, rank_address=26,
-                     importance=0.01,
-                     centroid=(23, 34),
-                     geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
+                      class_='highway', type='residential',
+                      name={'name': 'Road'}, address={'city': 'Barrow'},
+                      extratags={'surface': 'paved'},
+                      parent_place_id=34, linked_place_id=55,
+                      admin_level=15, country_code='gb',
+                      housenumber='4',
+                      postcode='34425', wikipedia='en:Faa',
+                      rank_search=27, rank_address=26,
+                      importance=0.01,
+                      centroid=(23, 34),
+                      geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
 
     api = frontend(apiobj, options={'details'})
     result = api.lookup([idobj])
@@ -79,17 +80,17 @@ def test_lookup_single_placex(apiobj, frontend, idobj):
 
 def test_lookup_multiple_places(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     name={'name': 'Road'}, address={'city': 'Barrow'},
-                     extratags={'surface': 'paved'},
-                     parent_place_id=34, linked_place_id=55,
-                     admin_level=15, country_code='gb',
-                     housenumber='4',
-                     postcode='34425', wikipedia='en:Faa',
-                     rank_search=27, rank_address=26,
-                     importance=0.01,
-                     centroid=(23, 34),
-                     geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
+                      class_='highway', type='residential',
+                      name={'name': 'Road'}, address={'city': 'Barrow'},
+                      extratags={'surface': 'paved'},
+                      parent_place_id=34, linked_place_id=55,
+                      admin_level=15, country_code='gb',
+                      housenumber='4',
+                      postcode='34425', wikipedia='en:Faa',
+                      rank_search=27, rank_address=26,
+                      importance=0.01,
+                      centroid=(23, 34),
+                      geometry='LINESTRING(23 34, 23.1 34, 23.1 34.1, 23 34)')
     apiobj.add_osmline(place_id=4924, osm_id=9928,
                        parent_place_id=12,
                        startnumber=1, endnumber=4, step=1,
@@ -97,7 +98,6 @@ def test_lookup_multiple_places(apiobj, frontend):
                        address={'city': 'Big'},
                        geometry='LINESTRING(23 34, 23 35)')
 
-
     api = frontend(apiobj, options={'details'})
     result = api.lookup((napi.OsmID('W', 1),
                          napi.OsmID('W', 4),
@@ -111,17 +111,17 @@ def test_lookup_multiple_places(apiobj, frontend):
 @pytest.mark.parametrize('gtype', list(napi.GeometryFormat))
 def test_simple_place_with_geometry(apiobj, frontend, gtype):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     name={'name': 'Road'}, address={'city': 'Barrow'},
-                     extratags={'surface': 'paved'},
-                     parent_place_id=34, linked_place_id=55,
-                     admin_level=15, country_code='gb',
-                     housenumber='4',
-                     postcode='34425', wikipedia='en:Faa',
-                     rank_search=27, rank_address=26,
-                     importance=0.01,
-                     centroid=(23, 34),
-                     geometry='POLYGON((23 34, 23.1 34, 23.1 34.1, 23 34))')
+                      class_='highway', type='residential',
+                      name={'name': 'Road'}, address={'city': 'Barrow'},
+                      extratags={'surface': 'paved'},
+                      parent_place_id=34, linked_place_id=55,
+                      admin_level=15, country_code='gb',
+                      housenumber='4',
+                      postcode='34425', wikipedia='en:Faa',
+                      rank_search=27, rank_address=26,
+                      importance=0.01,
+                      centroid=(23, 34),
+                      geometry='POLYGON((23 34, 23.1 34, 23.1 34.1, 23 34))')
 
     api = frontend(apiobj, options={'details'})
     result = api.lookup([napi.OsmID('W', 4)], geometry_output=gtype)
@@ -137,17 +137,17 @@ def test_simple_place_with_geometry(apiobj, frontend, gtype):
 
 def test_simple_place_with_geometry_simplified(apiobj, frontend):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',
-                     name={'name': 'Road'}, address={'city': 'Barrow'},
-                     extratags={'surface': 'paved'},
-                     parent_place_id=34, linked_place_id=55,
-                     admin_level=15, country_code='gb',
-                     housenumber='4',
-                     postcode='34425', wikipedia='en:Faa',
-                     rank_search=27, rank_address=26,
-                     importance=0.01,
-                     centroid=(23, 34),
-                     geometry='POLYGON((23 34, 22.999 34, 23.1 34, 23.1 34.1, 23 34))')
+                      class_='highway', type='residential',
+                      name={'name': 'Road'}, address={'city': 'Barrow'},
+                      extratags={'surface': 'paved'},
+                      parent_place_id=34, linked_place_id=55,
+                      admin_level=15, country_code='gb',
+                      housenumber='4',
+                      postcode='34425', wikipedia='en:Faa',
+                      rank_search=27, rank_address=26,
+                      importance=0.01,
+                      centroid=(23, 34),
+                      geometry='POLYGON((23 34, 22.999 34, 23.1 34, 23.1 34.1, 23 34))')
 
     api = frontend(apiobj, options={'details'})
     result = api.lookup([napi.OsmID('W', 4)],
@@ -159,5 +159,5 @@ def test_simple_place_with_geometry_simplified(apiobj, frontend):
 
     geom = json.loads(result[0].geometry['geojson'])
 
-    assert geom['type']  == 'Polygon'
+    assert geom['type'] == 'Polygon'
     assert geom['coordinates'] == [[[23, 34], [23.1, 34], [23.1, 34.1], [23, 34]]]
diff --git a/test/python/api/test_api_polygons_v1.py b/test/python/api/test_api_polygons_v1.py
index ac2b4cb9..e4700a95 100644
--- a/test/python/api/test_api_polygons_v1.py
+++ b/test/python/api/test_api_polygons_v1.py
@@ -2,21 +2,21 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the deletable v1 API call.
 """
 import json
 import datetime as dt
-from pathlib import Path
 
 import pytest
 
-from fake_adaptor import FakeAdaptor, FakeError, FakeResponse
+from fake_adaptor import FakeAdaptor
 
 import nominatim_api.v1.server_glue as glue
 
+
 class TestPolygonsEndPoint:
 
     @pytest.fixture(autouse=True)
@@ -35,13 +35,12 @@ class TestPolygonsEndPoint:
                                     errormessage text,
                                     prevgeometry geometry(Geometry,4326),
                                     newgeometry geometry(Geometry,4326)""",
-                    content=[(345, 'N', 'boundary', 'administrative',
-                              {'name': 'Foo'}, 'xx', self.recent,
-                              'some text', None, None),
-                             (781, 'R', 'landuse', 'wood',
-                              None, 'ds', self.now,
-                              'Area reduced by lots', None, None)])
-
+                      content=[(345, 'N', 'boundary', 'administrative',
+                               {'name': 'Foo'}, 'xx', self.recent,
+                               'some text', None, None),
+                               (781, 'R', 'landuse', 'wood',
+                                None, 'ds', self.now,
+                                'Area reduced by lots', None, None)])
 
     @pytest.mark.asyncio
     async def test_polygons_simple(self, api):
@@ -63,7 +62,6 @@ class TestPolygonsEndPoint:
                             'errormessage': 'Area reduced by lots',
                             'updated': self.now.isoformat(sep=' ', timespec='seconds')}]
 
-
     @pytest.mark.asyncio
     async def test_polygons_days(self, api):
         a = FakeAdaptor()
@@ -74,7 +72,6 @@ class TestPolygonsEndPoint:
 
         assert [r['osm_id'] for r in results] == [781]
 
-
     @pytest.mark.asyncio
     async def test_polygons_class(self, api):
         a = FakeAdaptor()
@@ -85,8 +82,6 @@ class TestPolygonsEndPoint:
 
         assert [r['osm_id'] for r in results] == [781]
 
-
-
     @pytest.mark.asyncio
     async def test_polygons_reduced(self, api):
         a = FakeAdaptor()
diff --git a/test/python/api/test_api_reverse.py b/test/python/api/test_api_reverse.py
index ff7f402b..d7d3ba7e 100644
--- a/test/python/api/test_api_reverse.py
+++ b/test/python/api/test_api_reverse.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for reverse API call.
@@ -18,6 +18,7 @@ import nominatim_api as napi
 
 API_OPTIONS = {'reverse'}
 
+
 def test_reverse_rank_30(apiobj, frontend):
     apiobj.add_placex(place_id=223, class_='place', type='house',
                       housenumber='1',
@@ -35,7 +36,7 @@ def test_reverse_rank_30(apiobj, frontend):
 def test_reverse_street(apiobj, frontend, country):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       country_code=country,
                       geometry='LINESTRING(9.995 10, 10.005 10)')
@@ -57,16 +58,18 @@ def test_reverse_ignore_unindexed(apiobj, frontend):
     assert result is None
 
 
-@pytest.mark.parametrize('y,layer,place_id', [(0.7, napi.DataLayer.ADDRESS, 223),
-                                              (0.70001, napi.DataLayer.POI, 224),
-                                              (0.7, napi.DataLayer.ADDRESS | napi.DataLayer.POI, 224),
-                                              (0.70001, napi.DataLayer.ADDRESS | napi.DataLayer.POI, 223),
-                                              (0.7, napi.DataLayer.MANMADE, 225),
-                                              (0.7, napi.DataLayer.RAILWAY, 226),
-                                              (0.7, napi.DataLayer.NATURAL, 227),
-                                              (0.70003, napi.DataLayer.MANMADE | napi.DataLayer.RAILWAY, 225),
-                                              (0.70003, napi.DataLayer.MANMADE | napi.DataLayer.NATURAL, 225),
-                                              (5, napi.DataLayer.ADDRESS, 229)])
+@pytest.mark.parametrize('y,layer,place_id',
+                         [(0.7, napi.DataLayer.ADDRESS, 223),
+                          (0.70001, napi.DataLayer.POI, 224),
+                          (0.7, napi.DataLayer.ADDRESS | napi.DataLayer.POI, 224),
+                          (0.70001, napi.DataLayer.ADDRESS | napi.DataLayer.POI, 223),
+                          (0.7, napi.DataLayer.MANMADE, 225),
+                          (0.7, napi.DataLayer.RAILWAY, 226),
+                          (0.7, napi.DataLayer.NATURAL, 227),
+                          (0.70003, napi.DataLayer.MANMADE | napi.DataLayer.RAILWAY, 225),
+                          (0.70003, napi.DataLayer.MANMADE | napi.DataLayer.NATURAL, 225),
+                          (5, napi.DataLayer.ADDRESS, 229),
+                          (5.0001, napi.DataLayer.ADDRESS, 229)])
 def test_reverse_rank_30_layers(apiobj, frontend, y, layer, place_id):
     apiobj.add_placex(place_id=223, osm_type='N', class_='place', type='house',
                       housenumber='1',
@@ -94,6 +97,12 @@ def test_reverse_rank_30_layers(apiobj, frontend, y, layer, place_id):
                       rank_address=30,
                       rank_search=30,
                       centroid=(1.3, 5))
+    apiobj.add_placex(place_id=230, class_='place', type='house',
+                      housenumber='2',
+                      address={'_inherited': ''},
+                      rank_address=30,
+                      rank_search=30,
+                      centroid=(1.3, 5.0001))
 
     api = frontend(apiobj, options=API_OPTIONS)
     assert api.reverse((1.3, y), layers=layer).place_id == place_id
@@ -108,14 +117,14 @@ def test_reverse_poi_layer_with_no_pois(apiobj, frontend):
 
     api = frontend(apiobj, options=API_OPTIONS)
     assert api.reverse((1.3, 0.70001), max_rank=29,
-                              layers=napi.DataLayer.POI) is None
+                       layers=napi.DataLayer.POI) is None
 
 
 @pytest.mark.parametrize('with_geom', [True, False])
 def test_reverse_housenumber_on_street(apiobj, frontend, with_geom):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       geometry='LINESTRING(9.995 10, 10.005 10)')
     apiobj.add_placex(place_id=991, class_='place', type='house',
@@ -125,7 +134,7 @@ def test_reverse_housenumber_on_street(apiobj, frontend, with_geom):
                       centroid=(10.0, 10.00001))
     apiobj.add_placex(place_id=1990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'Other Street'},
+                      name={'name': 'Other Street'},
                       centroid=(10.0, 1.0),
                       geometry='LINESTRING(9.995 1, 10.005 1)')
     apiobj.add_placex(place_id=1991, class_='place', type='house',
@@ -147,7 +156,7 @@ def test_reverse_housenumber_on_street(apiobj, frontend, with_geom):
 def test_reverse_housenumber_interpolation(apiobj, frontend, with_geom):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       geometry='LINESTRING(9.995 10, 10.005 10)')
     apiobj.add_placex(place_id=991, class_='place', type='house',
@@ -162,7 +171,7 @@ def test_reverse_housenumber_interpolation(apiobj, frontend, with_geom):
                        geometry='LINESTRING(9.995 10.00001, 10.005 10.00001)')
     apiobj.add_placex(place_id=1990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'Other Street'},
+                      name={'name': 'Other Street'},
                       centroid=(10.0, 20.0),
                       geometry='LINESTRING(9.995 20, 10.005 20)')
     apiobj.add_osmline(place_id=1992,
@@ -181,7 +190,7 @@ def test_reverse_housenumber_interpolation(apiobj, frontend, with_geom):
 def test_reverse_housenumber_point_interpolation(apiobj, frontend):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       geometry='LINESTRING(9.995 10, 10.005 10)')
     apiobj.add_osmline(place_id=992,
@@ -199,7 +208,7 @@ def test_reverse_housenumber_point_interpolation(apiobj, frontend):
 def test_reverse_tiger_number(apiobj, frontend):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       country_code='us',
                       geometry='LINESTRING(9.995 10, 10.005 10)')
@@ -217,7 +226,7 @@ def test_reverse_tiger_number(apiobj, frontend):
 def test_reverse_point_tiger(apiobj, frontend):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       country_code='us',
                       geometry='LINESTRING(9.995 10, 10.005 10)')
@@ -393,14 +402,15 @@ def test_reverse_interpolation_geometry(apiobj, frontend):
                        geometry='LINESTRING(9.995 10.00001, 10.005 10.00001)')
 
     api = frontend(apiobj, options=API_OPTIONS)
-    assert api.reverse((10.0, 10.0), geometry_output=napi.GeometryFormat.TEXT)\
-                     .geometry['text'] == 'POINT(10 10.00001)'
+    result = api.reverse((10.0, 10.0), geometry_output=napi.GeometryFormat.TEXT)
+
+    assert result.geometry['text'] == 'POINT(10 10.00001)'
 
 
 def test_reverse_tiger_geometry(apiobj, frontend):
     apiobj.add_placex(place_id=990, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(10.0, 10.0),
                       country_code='us',
                       geometry='LINESTRING(9.995 10, 10.005 10)')
@@ -411,7 +421,7 @@ def test_reverse_tiger_geometry(apiobj, frontend):
                      geometry='LINESTRING(9.995 10.00001, 10.005 10.00001)')
     apiobj.add_placex(place_id=1000, class_='highway', type='service',
                       rank_search=27, rank_address=27,
-                      name = {'name': 'My Street'},
+                      name={'name': 'My Street'},
                       centroid=(11.0, 11.0),
                       country_code='us',
                       geometry='LINESTRING(10.995 11, 11.005 11)')
@@ -426,8 +436,9 @@ def test_reverse_tiger_geometry(apiobj, frontend):
     params = {'geometry_output': napi.GeometryFormat.GEOJSON}
 
     output = api.reverse((10.0, 10.0), **params)
-    assert json.loads(output.geometry['geojson']) == {'coordinates': [10, 10.00001], 'type': 'Point'}
+    assert json.loads(output.geometry['geojson']) \
+        == {'coordinates': [10, 10.00001], 'type': 'Point'}
 
     output = api.reverse((11.0, 11.0), **params)
-    assert json.loads(output.geometry['geojson']) == {'coordinates': [11, 11.00001], 'type': 'Point'}
-
+    assert json.loads(output.geometry['geojson']) \
+        == {'coordinates': [11, 11.00001], 'type': 'Point'}
diff --git a/test/python/api/test_api_search.py b/test/python/api/test_api_search.py
index 54138e24..59a83aa9 100644
--- a/test/python/api/test_api_search.py
+++ b/test/python/api/test_api_search.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for search API calls.
@@ -10,17 +10,13 @@ Tests for search API calls.
 These tests make sure that all Python code is correct and executable.
 Functional tests can be found in the BDD test suite.
 """
-import json
-
 import pytest
 
-import sqlalchemy as sa
-
-import nominatim_api as napi
 import nominatim_api.logging as loglib
 
 API_OPTIONS = {'search'}
 
+
 @pytest.fixture(autouse=True)
 def setup_icu_tokenizer(apiobj):
     """ Setup the properties needed for using the ICU tokenizer.
@@ -28,8 +24,9 @@ def setup_icu_tokenizer(apiobj):
     apiobj.add_data('properties',
                     [{'property': 'tokenizer', 'value': 'icu'},
                      {'property': 'tokenizer_import_normalisation', 'value': ':: lower();'},
-                     {'property': 'tokenizer_import_transliteration', 'value': "'1' > '/1/'; 'ä' > 'ä '"},
-                    ])
+                     {'property': 'tokenizer_import_transliteration',
+                      'value': "'1' > '/1/'; 'ä' > 'ä '"},
+                     ])
 
 
 def test_search_no_content(apiobj, frontend):
@@ -64,7 +61,7 @@ def test_search_with_debug(apiobj, frontend, logtype):
 
     api = frontend(apiobj, options=API_OPTIONS)
     loglib.set_log_output(logtype)
-    results = api.search('TEST')
+    api.search('TEST')
 
     assert loglib.get_and_disable()
 
diff --git a/test/python/api/test_api_status.py b/test/python/api/test_api_status.py
index 9341b527..a80c8710 100644
--- a/test/python/api/test_api_status.py
+++ b/test/python/api/test_api_status.py
@@ -2,18 +2,17 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the status API call.
 """
 import datetime as dt
-import pytest
 
-from nominatim_db.version import NominatimVersion
 from nominatim_api.version import NOMINATIM_API_VERSION
 import nominatim_api as napi
 
+
 def test_status_no_extra_info(apiobj, frontend):
     api = frontend(apiobj)
     result = api.status()
diff --git a/test/python/api/test_api_types.py b/test/python/api/test_api_types.py
index fbb9b682..898b884d 100644
--- a/test/python/api/test_api_types.py
+++ b/test/python/api/test_api_types.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for loading of parameter dataclasses.
@@ -12,6 +12,7 @@ import pytest
 from nominatim_api.errors import UsageError
 import nominatim_api.types as typ
 
+
 def test_no_params_defaults():
     params = typ.LookupDetails.from_kwargs({})
 
@@ -24,7 +25,7 @@ def test_no_params_defaults():
                                  ('geometry_simplification', 'NaN')])
 def test_bad_format_reverse(k, v):
     with pytest.raises(UsageError):
-        params = typ.ReverseDetails.from_kwargs({k: v})
+        typ.ReverseDetails.from_kwargs({k: v})
 
 
 @pytest.mark.parametrize('rin,rout', [(-23, 0), (0, 0), (1, 1),
diff --git a/test/python/api/test_export.py b/test/python/api/test_export.py
index b0da52ce..7a4c6883 100644
--- a/test/python/api/test_export.py
+++ b/test/python/api/test_export.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for export CLI function.
@@ -11,12 +11,12 @@ import pytest
 
 import nominatim_db.cli
 
+
 @pytest.fixture
 def run_export(tmp_path, capsys):
     def _exec(args):
-        assert 0 == nominatim_db.cli.nominatim(osm2pgsql_path='OSM2PGSQL NOT AVAILABLE',
-                                               cli_args=['export', '--project-dir', str(tmp_path)]
-                                                        + args)
+        cli_args = ['export', '--project-dir', str(tmp_path)] + args
+        assert 0 == nominatim_db.cli.nominatim(cli_args=cli_args)
         return capsys.readouterr().out.split('\r\n')
 
     return _exec
@@ -25,9 +25,9 @@ def run_export(tmp_path, capsys):
 @pytest.fixture(autouse=True)
 def setup_database_with_context(apiobj):
     apiobj.add_placex(place_id=332, osm_type='W', osm_id=4,
-                     class_='highway', type='residential',  name='Street',
-                     country_code='pl', postcode='55674',
-                     rank_search=27, rank_address=26)
+                      class_='highway', type='residential',  name='Street',
+                      country_code='pl', postcode='55674',
+                      rank_search=27, rank_address=26)
     apiobj.add_address_placex(332, fromarea=False, isaddress=False,
                               distance=0.0034,
                               place_id=1000, osm_type='N', osm_id=3333,
diff --git a/test/python/api/test_helpers_v1.py b/test/python/api/test_helpers_v1.py
index 3a6a9a0b..10f0921b 100644
--- a/test/python/api/test_helpers_v1.py
+++ b/test/python/api/test_helpers_v1.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the helper functions for v1 API.
@@ -11,6 +11,7 @@ import pytest
 
 import nominatim_api.v1.helpers as helper
 
+
 @pytest.mark.parametrize('inp', ['',
                                  'abc',
                                  '12 23',
@@ -35,40 +36,42 @@ def test_extract_coords_with_text_before():
 def test_extract_coords_with_text_after():
     assert ('abc', 12.456, -78.90) == helper.extract_coords_from_query('-78.90, 12.456   abc')
 
+
 @pytest.mark.parametrize('inp', [' [12.456,-78.90] ', ' 12.456,-78.90 '])
 def test_extract_coords_with_spaces(inp):
     assert ('', -78.90, 12.456) == helper.extract_coords_from_query(inp)
 
+
 @pytest.mark.parametrize('inp', ['40 26.767 N 79 58.933 W',
-                     '40° 26.767′ N 79° 58.933′ W',
-                     "40° 26.767' N 79° 58.933' W",
-                     "40° 26.767'\n"
-                     "    N 79° 58.933' W",
-                     'N 40 26.767, W 79 58.933',
-                     'N 40°26.767′, W 79°58.933′',
-                     '	N 40°26.767′, W 79°58.933′',
-                     "N 40°26.767', W 79°58.933'",
- 
-                     '40 26 46 N 79 58 56 W',
-                     '40° 26′ 46″ N 79° 58′ 56″ W',
-                     '40° 26′ 46.00″ N 79° 58′ 56.00″ W',
-                     '40°26′46″N 79°58′56″W',
-                     'N 40 26 46 W 79 58 56',
-                     'N 40° 26′ 46″, W 79° 58′ 56″',
-                     'N 40° 26\' 46", W 79° 58\' 56"',
-                     'N 40° 26\' 46", W 79° 58\' 56"',
- 
-                     '40.446 -79.982',
-                     '40.446,-79.982',
-                     '40.446° N 79.982° W',
-                     'N 40.446° W 79.982°',
- 
-                     '[40.446 -79.982]',
-                     '[40.446,-79.982]',
-                     '       40.446  ,   -79.982     ',
-                     '       40.446  ,   -79.982     ',
-                     '       40.446	,   -79.982	',
-                     '       40.446,   -79.982	'])
+                                 '40° 26.767′ N 79° 58.933′ W',
+                                 "40° 26.767' N 79° 58.933' W",
+                                 "40° 26.767'\n"
+                                 "    N 79° 58.933' W",
+                                 'N 40 26.767, W 79 58.933',
+                                 'N 40°26.767′, W 79°58.933′',
+                                 '	N 40°26.767′, W 79°58.933′',
+                                 "N 40°26.767', W 79°58.933'",
+
+                                 '40 26 46 N 79 58 56 W',
+                                 '40° 26′ 46″ N 79° 58′ 56″ W',
+                                 '40° 26′ 46.00″ N 79° 58′ 56.00″ W',
+                                 '40°26′46″N 79°58′56″W',
+                                 'N 40 26 46 W 79 58 56',
+                                 'N 40° 26′ 46″, W 79° 58′ 56″',
+                                 'N 40° 26\' 46", W 79° 58\' 56"',
+                                 'N 40° 26\' 46", W 79° 58\' 56"',
+
+                                 '40.446 -79.982',
+                                 '40.446,-79.982',
+                                 '40.446° N 79.982° W',
+                                 'N 40.446° W 79.982°',
+
+                                 '[40.446 -79.982]',
+                                 '[40.446,-79.982]',
+                                 '       40.446  ,   -79.982     ',
+                                 '       40.446  ,   -79.982     ',
+                                 '       40.446	,   -79.982	',
+                                 '       40.446,   -79.982	'])
 def test_extract_coords_formats(inp):
     query, x, y = helper.extract_coords_from_query(inp)
 
@@ -108,9 +111,11 @@ def test_extract_category_good(inp):
     assert cls == 'shop'
     assert typ == 'fish'
 
+
 def test_extract_category_only():
     assert helper.extract_category_from_query('[shop=market]') == ('', 'shop', 'market')
 
+
 @pytest.mark.parametrize('inp', ['house []', 'nothing', '[352]'])
-def  test_extract_category_no_match(inp):
+def test_extract_category_no_match(inp):
     assert helper.extract_category_from_query(inp) == (inp, None, None)
diff --git a/test/python/api/test_localization.py b/test/python/api/test_localization.py
index 21fa72c8..c3e02596 100644
--- a/test/python/api/test_localization.py
+++ b/test/python/api/test_localization.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test functions for adapting results to the user's locale.
@@ -11,34 +11,232 @@ import pytest
 
 from nominatim_api import Locales
 
+
 def test_display_name_empty_names():
-    l = Locales(['en', 'de'])
+    loc = Locales(['en', 'de'])
+
+    assert loc.display_name(None) == ''
+    assert loc.display_name({}) == ''
 
-    assert l.display_name(None) == ''
-    assert l.display_name({}) == ''
 
 def test_display_name_none_localized():
-    l = Locales()
+    loc = Locales()
+
+    assert loc.display_name({}) == ''
+    assert loc.display_name({'name:de': 'DE', 'name': 'ALL'}) == 'ALL'
+    assert loc.display_name({'ref': '34', 'name:de': 'DE'}) == '34'
+
+
+def test_output_names_none_localized():
+    loc = Locales()
+
+    expected_tags = [
+        'name', '_place_name', 'brand', '_place_brand', 'official_name', '_place_official_name',
+        'short_name', '_place_short_name', 'ref', '_place_ref'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_none_localized_and_custom_output_names(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,entrance:XX,name,brand,test_tag,'
+        'official_name:XX,short_name:XX,alt_name:XX'
+    )
+    loc = Locales()
+
+    expected_tags = [
+        'name', '_place_name', 'brand', '_place_brand', 'test_tag', '_place_test_tag'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_none_localized_and_custom_output_names_more_than_two_changes(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,brand,test_tag:XX,official_name,short_name:XX,'
+        'alt_name,another_tag_with:XX,another_tag_withoutXX'
+    )
+    loc = Locales()
 
-    assert l.display_name({}) == ''
-    assert l.display_name({'name:de': 'DE', 'name': 'ALL'}) == 'ALL'
-    assert l.display_name({'ref': '34', 'name:de': 'DE'}) == '34'
+    expected_tags = [
+        'brand', '_place_brand', 'official_name', '_place_official_name', 'alt_name',
+        '_place_alt_name', 'another_tag_withoutXX', '_place_another_tag_withoutXX'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_none_localized_and_custom_output_names_including_space(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,name ,short_name:XX, short_name'
+    )
+    loc = Locales()
+
+    expected_tags = [
+        'name', '_place_name', 'short_name', '_place_short_name'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
 
 
 def test_display_name_localized():
-    l = Locales(['en', 'de'])
+    loc = Locales(['en', 'de'])
+
+    assert loc.display_name({}) == ''
+    assert loc.display_name({'name:de': 'DE', 'name': 'ALL'}) == 'DE'
+    assert loc.display_name({'ref': '34', 'name:de': 'DE'}) == 'DE'
+
+
+def test_output_names_localized():
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es', 'name', '_place_name', 'brand',
+        '_place_brand', 'official_name:en', '_place_official_name:en', 'official_name:es',
+        '_place_official_name:es', 'short_name:en', '_place_short_name:en', 'short_name:es',
+        '_place_short_name:es', 'official_name', '_place_official_name', 'short_name',
+        '_place_short_name', 'ref', '_place_ref'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_including_space(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,name ,short_name:XX, short_name'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es',
+        'name', '_place_name',
+        'short_name:en', '_place_short_name:en', 'short_name:es', '_place_short_name:es',
+        'short_name', '_place_short_name'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,entrance:XX,name,brand,test_tag,official_name:XX,short_name:XX,alt_name:XX'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es', 'entrance:en',
+        '_place_entrance:en', 'entrance:es', '_place_entrance:es', 'name', '_place_name',
+        'brand', '_place_brand', 'test_tag', '_place_test_tag', 'official_name:en',
+        '_place_official_name:en', 'official_name:es', '_place_official_name:es',
+        'short_name:en', '_place_short_name:en', 'short_name:es', '_place_short_name:es',
+        'alt_name:en', '_place_alt_name:en', 'alt_name:es', '_place_alt_name:es'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_start_with_tag_that_has_no_XX(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name,brand,test_tag,official_name:XX,short_name:XX,alt_name:XX'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name', '_place_name', 'brand', '_place_brand', 'test_tag', '_place_test_tag',
+        'official_name:en', '_place_official_name:en', 'official_name:es',
+        '_place_official_name:es', 'short_name:en', '_place_short_name:en', 'short_name:es',
+        '_place_short_name:es', 'alt_name:en', '_place_alt_name:en', 'alt_name:es',
+        '_place_alt_name:es'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_no_named_tags(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name,brand,test_tag'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name', '_place_name', 'brand', '_place_brand', 'test_tag', '_place_test_tag'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_only_named_tags(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,entrance:XX,official_name:XX,short_name:XX,alt_name:XX'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es', 'entrance:en',
+        '_place_entrance:en', 'entrance:es', '_place_entrance:es', 'official_name:en',
+        '_place_official_name:en', 'official_name:es', '_place_official_name:es',
+        'short_name:en', '_place_short_name:en', 'short_name:es', '_place_short_name:es',
+        'alt_name:en', '_place_alt_name:en', 'alt_name:es', '_place_alt_name:es'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_more_than_two_changes(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,brand,test_tag:XX,official_name,short_name:XX,'
+        'alt_name,another_tag_with:XX,another_tag_withoutXX'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es', 'brand', '_place_brand',
+        'test_tag:en', '_place_test_tag:en', 'test_tag:es', '_place_test_tag:es', 'official_name',
+        '_place_official_name', 'short_name:en', '_place_short_name:en', 'short_name:es',
+        '_place_short_name:es', 'alt_name', '_place_alt_name', 'another_tag_with:en',
+        '_place_another_tag_with:en', 'another_tag_with:es', '_place_another_tag_with:es',
+        'another_tag_withoutXX', '_place_another_tag_withoutXX'
+    ]
+
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
+
+
+def test_output_names_localized_and_custom_output_names_XX_in_the_middle(monkeypatch):
+    monkeypatch.setenv(
+        'NOMINATIM_OUTPUT_NAMES',
+        'name:XX,br:XXand,test_tag:XX,official_name,sh:XXort_name:XX,'
+        'alt_name,another_tag_with:XX,another_tag_withoutXX'
+    )
+    loc = Locales(['en', 'es'])
+
+    expected_tags = [
+        'name:en', '_place_name:en', 'name:es', '_place_name:es', 'br:XXand', '_place_br:XXand',
+        'test_tag:en', '_place_test_tag:en', 'test_tag:es', '_place_test_tag:es', 'official_name',
+        '_place_official_name', 'sh:XXort_name:en', '_place_sh:XXort_name:en', 'sh:XXort_name:es',
+        '_place_sh:XXort_name:es', 'alt_name', '_place_alt_name', 'another_tag_with:en',
+        '_place_another_tag_with:en', 'another_tag_with:es', '_place_another_tag_with:es',
+        'another_tag_withoutXX', '_place_another_tag_withoutXX'
+    ]
 
-    assert l.display_name({}) == ''
-    assert l.display_name({'name:de': 'DE', 'name': 'ALL'}) == 'DE'
-    assert l.display_name({'ref': '34', 'name:de': 'DE'}) == 'DE'
+    assert loc.name_tags == expected_tags, f'Expected {expected_tags}, but got {loc.name_tags}'
 
 
 def test_display_name_preference():
-    l = Locales(['en', 'de'])
+    loc = Locales(['en', 'de'])
 
-    assert l.display_name({}) == ''
-    assert l.display_name({'name:de': 'DE', 'name:en': 'EN'}) == 'EN'
-    assert l.display_name({'official_name:en': 'EN', 'name:de': 'DE'}) == 'DE'
+    assert loc.display_name({}) == ''
+    assert loc.display_name({'name:de': 'DE', 'name:en': 'EN'}) == 'EN'
+    assert loc.display_name({'official_name:en': 'EN', 'name:de': 'DE'}) == 'DE'
 
 
 @pytest.mark.parametrize('langstr,langlist',
diff --git a/test/python/api/test_result_formatting_v1.py b/test/python/api/test_result_formatting_v1.py
index aaecab45..406c7654 100644
--- a/test/python/api/test_result_formatting_v1.py
+++ b/test/python/api/test_result_formatting_v1.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for formatting results for the V1 API.
@@ -22,6 +22,7 @@ STATUS_FORMATS = {'text', 'json'}
 
 # StatusResult
 
+
 def test_status_format_list():
     assert set(v1_format.list_formats(napi.StatusResult)) == STATUS_FORMATS
 
@@ -36,11 +37,13 @@ def test_status_unsupported():
 
 
 def test_status_format_text():
-    assert v1_format.format_result(napi.StatusResult(0, 'message here'), 'text', {}) == 'OK'
+    assert v1_format.format_result(napi.StatusResult(0, 'message here'), 'text', {}) \
+        == 'OK'
 
 
-def test_status_format_text():
-    assert v1_format.format_result(napi.StatusResult(500, 'message here'), 'text', {}) == 'ERROR: message here'
+def test_status_format_error_text():
+    assert v1_format.format_result(napi.StatusResult(500, 'message here'), 'text', {}) \
+        == 'ERROR: message here'
 
 
 def test_status_format_json_minimal():
@@ -48,8 +51,9 @@ def test_status_format_json_minimal():
 
     result = v1_format.format_result(status, 'json', {})
 
-    assert result == \
-           f'{{"status":700,"message":"Bad format.","software_version":"{napi.__version__}"}}'
+    assert json.loads(result) == {'status': 700,
+                                  'message': 'Bad format.',
+                                  'software_version': napi.__version__}
 
 
 def test_status_format_json_full():
@@ -59,8 +63,11 @@ def test_status_format_json_full():
 
     result = v1_format.format_result(status, 'json', {})
 
-    assert result == \
-           f'{{"status":0,"message":"OK","data_updated":"2010-02-07T20:20:03+00:00","software_version":"{napi.__version__}","database_version":"5.6"}}'
+    assert json.loads(result) == {'status': 0,
+                                  'message': 'OK',
+                                  'data_updated': '2010-02-07T20:20:03+00:00',
+                                  'software_version': napi.__version__,
+                                  'database_version': '5.6'}
 
 
 # DetailedResult
@@ -86,7 +93,7 @@ def test_search_details_minimal():
             'extratags': {},
             'centroid': {'type': 'Point', 'coordinates': [1.0, 2.0]},
             'geometry': {'type': 'Point', 'coordinates': [1.0, 2.0]},
-           }
+            }
 
 
 def test_search_details_full():
@@ -110,7 +117,7 @@ def test_search_details_full():
                   rank_search=28,
                   importance=0.0443,
                   country_code='ll',
-                  indexed_date = import_date
+                  indexed_date=import_date
                   )
     search.localize(napi.Locales())
 
@@ -140,7 +147,7 @@ def test_search_details_full():
             'isarea': False,
             'centroid': {'type': 'Point', 'coordinates': [56.947, -87.44]},
             'geometry': {'type': 'Point', 'coordinates': [56.947, -87.44]},
-           }
+            }
 
 
 @pytest.mark.parametrize('gtype,isarea', [('ST_Point', False),
@@ -149,9 +156,9 @@ def test_search_details_full():
                                           ('ST_MultiPolygon', True)])
 def test_search_details_no_geometry(gtype, isarea):
     search = napi.DetailedResult(napi.SourceTable.PLACEX,
-                               ('place', 'thing'),
-                               napi.Point(1.0, 2.0),
-                               geometry={'type': gtype})
+                                 ('place', 'thing'),
+                                 napi.Point(1.0, 2.0),
+                                 geometry={'type': gtype})
 
     result = v1_format.format_result(search, 'json', {})
     js = json.loads(result)
@@ -161,16 +168,17 @@ def test_search_details_no_geometry(gtype, isarea):
 
 
 def test_search_details_with_geometry():
-    search = napi.DetailedResult(napi.SourceTable.PLACEX,
-                                 ('place', 'thing'),
-                                 napi.Point(1.0, 2.0),
-                                 geometry={'geojson': '{"type":"Point","coordinates":[56.947,-87.44]}'})
+    search = napi.DetailedResult(
+        napi.SourceTable.PLACEX,
+        ('place', 'thing'),
+        napi.Point(1.0, 2.0),
+        geometry={'geojson': '{"type":"Point","coordinates":[56.947,-87.44]}'})
 
     result = v1_format.format_result(search, 'json', {})
     js = json.loads(result)
 
     assert js['geometry'] == {'type': 'Point', 'coordinates': [56.947, -87.44]}
-    assert js['isarea'] == False
+    assert js['isarea'] is False
 
 
 def test_search_details_with_icon_available():
@@ -226,7 +234,7 @@ def test_search_details_with_address_minimal():
 @pytest.mark.parametrize('field,outfield', [('address_rows', 'address'),
                                             ('linked_rows', 'linked_places'),
                                             ('parented_rows', 'hierarchy')
-                                           ])
+                                            ])
 def test_search_details_with_further_infos(field, outfield):
     search = napi.DetailedResult(napi.SourceTable.PLACEX,
                                  ('place', 'thing'),
@@ -249,50 +257,49 @@ def test_search_details_with_further_infos(field, outfield):
     js = json.loads(result)
 
     assert js[outfield] == [{'localname': 'Trespass',
-                              'place_id': 3498,
-                              'osm_id': 442,
-                              'osm_type': 'R',
-                              'place_type': 'spec',
-                              'class': 'bnd',
-                              'type': 'note',
-                              'admin_level': 4,
-                              'rank_address': 10,
-                              'distance': 0.034,
-                              'isaddress': True}]
+                             'place_id': 3498,
+                             'osm_id': 442,
+                             'osm_type': 'R',
+                             'place_type': 'spec',
+                             'class': 'bnd',
+                             'type': 'note',
+                             'admin_level': 4,
+                             'rank_address': 10,
+                             'distance': 0.034,
+                             'isaddress': True}]
 
 
 def test_search_details_grouped_hierarchy():
     search = napi.DetailedResult(napi.SourceTable.PLACEX,
                                  ('place', 'thing'),
                                  napi.Point(1.0, 2.0),
-                                 parented_rows =
-                                     [napi.AddressLine(place_id=3498,
-                                             osm_object=('R', 442),
-                                             category=('bnd', 'note'),
-                                             names={'name': 'Trespass'},
-                                             extratags={'access': 'no',
-                                                        'place_type': 'spec'},
-                                             admin_level=4,
-                                             fromarea=True,
-                                             isaddress=True,
-                                             rank_address=10,
-                                             distance=0.034)
-                                     ])
+                                 parented_rows=[napi.AddressLine(
+                                    place_id=3498,
+                                    osm_object=('R', 442),
+                                    category=('bnd', 'note'),
+                                    names={'name': 'Trespass'},
+                                    extratags={'access': 'no',
+                                               'place_type': 'spec'},
+                                    admin_level=4,
+                                    fromarea=True,
+                                    isaddress=True,
+                                    rank_address=10,
+                                    distance=0.034)])
 
     result = v1_format.format_result(search, 'json', {'group_hierarchy': True})
     js = json.loads(result)
 
     assert js['hierarchy'] == {'note': [{'localname': 'Trespass',
-                              'place_id': 3498,
-                              'osm_id': 442,
-                              'osm_type': 'R',
-                              'place_type': 'spec',
-                              'class': 'bnd',
-                              'type': 'note',
-                              'admin_level': 4,
-                              'rank_address': 10,
-                              'distance': 0.034,
-                              'isaddress': True}]}
+                                         'place_id': 3498,
+                                         'osm_id': 442,
+                                         'osm_type': 'R',
+                                         'place_type': 'spec',
+                                         'class': 'bnd',
+                                         'type': 'note',
+                                         'admin_level': 4,
+                                         'rank_address': 10,
+                                         'distance': 0.034,
+                                         'isaddress': True}]}
 
 
 def test_search_details_keywords_name():
@@ -307,7 +314,7 @@ def test_search_details_keywords_name():
     js = json.loads(result)
 
     assert js['keywords'] == {'name': [{'id': 23, 'token': 'foo'},
-                                      {'id': 24, 'token': 'foo'}],
+                                       {'id': 24, 'token': 'foo'}],
                               'address': []}
 
 
@@ -323,6 +330,5 @@ def test_search_details_keywords_address():
     js = json.loads(result)
 
     assert js['keywords'] == {'address': [{'id': 23, 'token': 'foo'},
-                                      {'id': 24, 'token': 'foo'}],
+                                          {'id': 24, 'token': 'foo'}],
                               'name': []}
-
diff --git a/test/python/api/test_result_formatting_v1_reverse.py b/test/python/api/test_result_formatting_v1_reverse.py
index 2c036a65..902f0e79 100644
--- a/test/python/api/test_result_formatting_v1_reverse.py
+++ b/test/python/api/test_result_formatting_v1_reverse.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for formatting reverse results for the V1 API.
@@ -20,6 +20,7 @@ import nominatim_api as napi
 
 FORMATS = ['json', 'jsonv2', 'geojson', 'geocodejson', 'xml']
 
+
 @pytest.mark.parametrize('fmt', FORMATS)
 def test_format_reverse_minimal(fmt):
     reverse = napi.ReverseResult(napi.SourceTable.PLACEX,
@@ -104,8 +105,7 @@ def test_format_reverse_with_address(fmt):
     reverse.localize(napi.Locales())
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'addressdetails': True})
-
+                                  {'addressdetails': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -168,7 +168,7 @@ def test_format_reverse_geocodejson_special_parts():
     reverse.localize(napi.Locales())
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), 'geocodejson',
-                                 {'addressdetails': True})
+                                  {'addressdetails': True})
 
     props = json.loads(raw)['features'][0]['properties']['geocoding']
     assert props['housenumber'] == '1'
@@ -184,8 +184,7 @@ def test_format_reverse_with_address_none(fmt):
                                  address_rows=napi.AddressLines())
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'addressdetails': True})
-
+                                  {'addressdetails': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -211,10 +210,10 @@ def test_format_reverse_with_extratags(fmt):
     reverse = napi.ReverseResult(napi.SourceTable.PLACEX,
                                  ('place', 'thing'),
                                  napi.Point(1.0, 2.0),
-                                 extratags={'one': 'A', 'two':'B'})
+                                 extratags={'one': 'A', 'two': 'B'})
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'extratags': True})
+                                  {'extratags': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -226,7 +225,7 @@ def test_format_reverse_with_extratags(fmt):
         else:
             extra = result['extratags']
 
-        assert extra == {'one': 'A', 'two':'B'}
+        assert extra == {'one': 'A', 'two': 'B'}
 
 
 @pytest.mark.parametrize('fmt', ['json', 'jsonv2', 'geojson', 'xml'])
@@ -236,7 +235,7 @@ def test_format_reverse_with_extratags_none(fmt):
                                  napi.Point(1.0, 2.0))
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'extratags': True})
+                                  {'extratags': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -256,10 +255,10 @@ def test_format_reverse_with_namedetails_with_name(fmt):
     reverse = napi.ReverseResult(napi.SourceTable.PLACEX,
                                  ('place', 'thing'),
                                  napi.Point(1.0, 2.0),
-                                 names={'name': 'A', 'ref':'1'})
+                                 names={'name': 'A', 'ref': '1'})
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'namedetails': True})
+                                  {'namedetails': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -271,7 +270,7 @@ def test_format_reverse_with_namedetails_with_name(fmt):
         else:
             extra = result['namedetails']
 
-        assert extra == {'name': 'A', 'ref':'1'}
+        assert extra == {'name': 'A', 'ref': '1'}
 
 
 @pytest.mark.parametrize('fmt', ['json', 'jsonv2', 'geojson', 'xml'])
@@ -281,7 +280,7 @@ def test_format_reverse_with_namedetails_without_name(fmt):
                                  napi.Point(1.0, 2.0))
 
     raw = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                 {'namedetails': True})
+                                  {'namedetails': True})
 
     if fmt == 'xml':
         root = ET.fromstring(raw)
@@ -303,7 +302,7 @@ def test_search_details_with_icon_available(fmt):
                                  napi.Point(1.0, 2.0))
 
     result = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                    {'icon_base_url': 'foo'})
+                                     {'icon_base_url': 'foo'})
 
     js = json.loads(result)
 
@@ -317,7 +316,6 @@ def test_search_details_with_icon_not_available(fmt):
                                  napi.Point(1.0, 2.0))
 
     result = v1_format.format_result(napi.ReverseResults([reverse]), fmt,
-                                    {'icon_base_url': 'foo'})
+                                     {'icon_base_url': 'foo'})
 
     assert 'icon' not in json.loads(result)
-
diff --git a/test/python/api/test_results.py b/test/python/api/test_results.py
index f0bfa163..8e9fbf68 100644
--- a/test/python/api/test_results.py
+++ b/test/python/api/test_results.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for result datatype helper functions.
@@ -11,16 +11,15 @@ import struct
 from binascii import hexlify
 
 import pytest
-import pytest_asyncio
-import sqlalchemy as sa
-
 
 from nominatim_api import SourceTable, DetailedResult, Point
 import nominatim_api.results as nresults
 
+
 def mkpoint(x, y):
     return hexlify(struct.pack("=biidd", 1, 0x20000001, 4326, x, y)).decode('utf-8')
 
+
 class FakeRow:
     def __init__(self, **kwargs):
         if 'parent_place_id' not in kwargs:
@@ -39,6 +38,7 @@ def test_minimal_detailed_result():
     assert res.lat == 0.5
     assert res.calculated_importance() == pytest.approx(0.00001)
 
+
 def test_detailed_result_custom_importance():
     res = DetailedResult(SourceTable.PLACEX,
                          ('amenity', 'post_box'),
diff --git a/test/python/api/test_server_glue_v1.py b/test/python/api/test_server_glue_v1.py
index 6ea790c0..8d9f0940 100644
--- a/test/python/api/test_server_glue_v1.py
+++ b/test/python/api/test_server_glue_v1.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the Python web frameworks adaptor, v1 API.
@@ -121,7 +121,6 @@ class TestAdaptorRaiseError:
 
         return excinfo.value
 
-
     def test_without_content_set(self):
         err = self.run_raise_error('TEST', 404)
 
@@ -129,7 +128,6 @@ class TestAdaptorRaiseError:
         assert err.msg == 'ERROR 404: TEST'
         assert err.status == 404
 
-
     def test_json(self):
         self.adaptor.content_type = 'application/json; charset=utf-8'
 
@@ -139,7 +137,6 @@ class TestAdaptorRaiseError:
         assert content['code'] == 501
         assert content['message'] == 'TEST'
 
-
     def test_xml(self):
         self.adaptor.content_type = 'text/xml; charset=utf-8'
 
@@ -235,7 +232,6 @@ class TestStatusEndpoint:
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'status', _status)
 
-
     @pytest.mark.asyncio
     async def test_status_without_params(self):
         a = FakeAdaptor()
@@ -247,7 +243,6 @@ class TestStatusEndpoint:
         assert resp.status == 200
         assert resp.content_type == 'text/plain; charset=utf-8'
 
-
     @pytest.mark.asyncio
     async def test_status_with_error(self):
         a = FakeAdaptor()
@@ -259,7 +254,6 @@ class TestStatusEndpoint:
         assert resp.status == 500
         assert resp.content_type == 'text/plain; charset=utf-8'
 
-
     @pytest.mark.asyncio
     async def test_status_json_with_error(self):
         a = FakeAdaptor(params={'format': 'json'})
@@ -271,7 +265,6 @@ class TestStatusEndpoint:
         assert resp.status == 200
         assert resp.content_type == 'application/json; charset=utf-8'
 
-
     @pytest.mark.asyncio
     async def test_status_bad_format(self):
         a = FakeAdaptor(params={'format': 'foo'})
@@ -298,7 +291,6 @@ class TestDetailsEndpoint:
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'details', _lookup)
 
-
     @pytest.mark.asyncio
     async def test_details_no_params(self):
         a = FakeAdaptor()
@@ -306,7 +298,6 @@ class TestDetailsEndpoint:
         with pytest.raises(FakeError, match='^400 -- .*Missing'):
             await glue.details_endpoint(napi.NominatimAPIAsync(), a)
 
-
     @pytest.mark.asyncio
     async def test_details_by_place_id(self):
         a = FakeAdaptor(params={'place_id': '4573'})
@@ -315,7 +306,6 @@ class TestDetailsEndpoint:
 
         assert self.lookup_args[0].place_id == 4573
 
-
     @pytest.mark.asyncio
     async def test_details_by_osm_id(self):
         a = FakeAdaptor(params={'osmtype': 'N', 'osmid': '45'})
@@ -326,7 +316,6 @@ class TestDetailsEndpoint:
         assert self.lookup_args[0].osm_id == 45
         assert self.lookup_args[0].osm_class is None
 
-
     @pytest.mark.asyncio
     async def test_details_with_debugging(self):
         a = FakeAdaptor(params={'osmtype': 'N', 'osmid': '45', 'debug': '1'})
@@ -337,7 +326,6 @@ class TestDetailsEndpoint:
         assert resp.content_type == 'text/html; charset=utf-8'
         assert content.tag == 'html'
 
-
     @pytest.mark.asyncio
     async def test_details_no_result(self):
         a = FakeAdaptor(params={'place_id': '4573'})
@@ -353,14 +341,14 @@ class TestReverseEndPoint:
     @pytest.fixture(autouse=True)
     def patch_reverse_func(self, monkeypatch):
         self.result = napi.ReverseResult(napi.SourceTable.PLACEX,
-                                          ('place', 'thing'),
-                                          napi.Point(1.0, 2.0))
+                                         ('place', 'thing'),
+                                         napi.Point(1.0, 2.0))
+
         async def _reverse(*args, **kwargs):
             return self.result
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'reverse', _reverse)
 
-
     @pytest.mark.asyncio
     @pytest.mark.parametrize('params', [{}, {'lat': '3.4'}, {'lon': '6.7'}])
     async def test_reverse_no_params(self, params):
@@ -371,19 +359,6 @@ class TestReverseEndPoint:
         with pytest.raises(FakeError, match='^400 -- (?s:.*)missing'):
             await glue.reverse_endpoint(napi.NominatimAPIAsync(), a)
 
-
-    @pytest.mark.asyncio
-    @pytest.mark.parametrize('params', [{'lat': '45.6', 'lon': '4563'}])
-    async def test_reverse_success(self, params):
-        a = FakeAdaptor()
-        a.params = params
-        a.params['format'] = 'json'
-
-        res = await glue.reverse_endpoint(napi.NominatimAPIAsync(), a)
-
-        assert res == ''
-
-
     @pytest.mark.asyncio
     async def test_reverse_success(self):
         a = FakeAdaptor()
@@ -392,7 +367,6 @@ class TestReverseEndPoint:
 
         assert await glue.reverse_endpoint(napi.NominatimAPIAsync(), a)
 
-
     @pytest.mark.asyncio
     async def test_reverse_from_search(self):
         a = FakeAdaptor()
@@ -413,12 +387,12 @@ class TestLookupEndpoint:
         self.results = [napi.SearchResult(napi.SourceTable.PLACEX,
                                           ('place', 'thing'),
                                           napi.Point(1.0, 2.0))]
+
         async def _lookup(*args, **kwargs):
             return napi.SearchResults(self.results)
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'lookup', _lookup)
 
-
     @pytest.mark.asyncio
     async def test_lookup_no_params(self):
         a = FakeAdaptor()
@@ -428,7 +402,6 @@ class TestLookupEndpoint:
 
         assert res.output == '[]'
 
-
     @pytest.mark.asyncio
     @pytest.mark.parametrize('param', ['w', 'bad', ''])
     async def test_lookup_bad_params(self, param):
@@ -440,7 +413,6 @@ class TestLookupEndpoint:
 
         assert len(json.loads(res.output)) == 1
 
-
     @pytest.mark.asyncio
     @pytest.mark.parametrize('param', ['p234234', '4563'])
     async def test_lookup_bad_osm_type(self, param):
@@ -452,7 +424,6 @@ class TestLookupEndpoint:
 
         assert len(json.loads(res.output)) == 1
 
-
     @pytest.mark.asyncio
     async def test_lookup_working(self):
         a = FakeAdaptor()
@@ -473,12 +444,12 @@ class TestSearchEndPointSearch:
         self.results = [napi.SearchResult(napi.SourceTable.PLACEX,
                                           ('place', 'thing'),
                                           napi.Point(1.0, 2.0))]
+
         async def _search(*args, **kwargs):
             return napi.SearchResults(self.results)
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'search', _search)
 
-
     @pytest.mark.asyncio
     async def test_search_free_text(self):
         a = FakeAdaptor()
@@ -488,7 +459,6 @@ class TestSearchEndPointSearch:
 
         assert len(json.loads(res.output)) == 1
 
-
     @pytest.mark.asyncio
     async def test_search_free_text_xml(self):
         a = FakeAdaptor()
@@ -500,7 +470,6 @@ class TestSearchEndPointSearch:
         assert res.status == 200
         assert res.output.index('something') > 0
 
-
     @pytest.mark.asyncio
     async def test_search_free_and_structured(self):
         a = FakeAdaptor()
@@ -508,8 +477,7 @@ class TestSearchEndPointSearch:
         a.params['city'] = 'ignored'
 
         with pytest.raises(FakeError, match='^400 -- .*cannot be used together'):
-            res = await glue.search_endpoint(napi.NominatimAPIAsync(), a)
-
+            await glue.search_endpoint(napi.NominatimAPIAsync(), a)
 
     @pytest.mark.asyncio
     @pytest.mark.parametrize('dedupe,numres', [(True, 1), (False, 2)])
@@ -532,12 +500,12 @@ class TestSearchEndPointSearchAddress:
         self.results = [napi.SearchResult(napi.SourceTable.PLACEX,
                                           ('place', 'thing'),
                                           napi.Point(1.0, 2.0))]
+
         async def _search(*args, **kwargs):
             return napi.SearchResults(self.results)
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'search_address', _search)
 
-
     @pytest.mark.asyncio
     async def test_search_structured(self):
         a = FakeAdaptor()
@@ -555,12 +523,12 @@ class TestSearchEndPointSearchCategory:
         self.results = [napi.SearchResult(napi.SourceTable.PLACEX,
                                           ('place', 'thing'),
                                           napi.Point(1.0, 2.0))]
+
         async def _search(*args, **kwargs):
             return napi.SearchResults(self.results)
 
         monkeypatch.setattr(napi.NominatimAPIAsync, 'search_category', _search)
 
-
     @pytest.mark.asyncio
     async def test_search_category(self):
         a = FakeAdaptor()
diff --git a/test/python/api/test_warm.py b/test/python/api/test_warm.py
index f0c9986d..02ca0766 100644
--- a/test/python/api/test_warm.py
+++ b/test/python/api/test_warm.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for warm-up CLI function.
@@ -11,6 +11,7 @@ import pytest
 
 import nominatim_db.cli
 
+
 @pytest.fixture(autouse=True)
 def setup_database_with_context(apiobj, table_factory):
     table_factory('word',
@@ -21,12 +22,12 @@ def setup_database_with_context(apiobj, table_factory):
     apiobj.add_data('properties',
                     [{'property': 'tokenizer', 'value': 'icu'},
                      {'property': 'tokenizer_import_normalisation', 'value': ':: lower();'},
-                     {'property': 'tokenizer_import_transliteration', 'value': "'1' > '/1/'; 'ä' > 'ä '"},
-                    ])
+                     {'property': 'tokenizer_import_transliteration',
+                      'value': "'1' > '/1/'; 'ä' > 'ä '"}
+                     ])
 
 
 @pytest.mark.parametrize('args', [['--search-only'], ['--reverse-only']])
 def test_warm_all(tmp_path, args):
-    assert 0 == nominatim_db.cli.nominatim(osm2pgsql_path='OSM2PGSQL NOT AVAILABLE',
-                                           cli_args=['admin', '--project-dir', str(tmp_path),
+    assert 0 == nominatim_db.cli.nominatim(cli_args=['admin', '--project-dir', str(tmp_path),
                                                      '--warm'] + args)
diff --git a/test/python/cli/conftest.py b/test/python/cli/conftest.py
index 84f2d659..0c61b29e 100644
--- a/test/python/cli/conftest.py
+++ b/test/python/cli/conftest.py
@@ -2,12 +2,13 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 import pytest
 
 import nominatim_db.cli
 
+
 class MockParamCapture:
     """ Mock that records the parameters with which a function was called
         as well as the number of calls.
@@ -68,8 +69,7 @@ def cli_call():
         Returns a function that can be called with the desired CLI arguments.
     """
     def _call_nominatim(*args):
-        return nominatim_db.cli.nominatim(osm2pgsql_path='OSM2PGSQL NOT AVAILABLE',
-                                          cli_args=args)
+        return nominatim_db.cli.nominatim(cli_args=args)
 
     return _call_nominatim
 
diff --git a/test/python/cli/test_cli.py b/test/python/cli/test_cli.py
index d42df50a..a538049e 100644
--- a/test/python/cli/test_cli.py
+++ b/test/python/cli/test_cli.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for command line interface wrapper.
@@ -11,7 +11,6 @@ These tests just check that the various command line parameters route to the
 correct functionality. They use a lot of monkeypatching to avoid executing
 the actual functions.
 """
-import importlib
 import pytest
 
 import nominatim_db.indexer.indexer
@@ -28,6 +27,7 @@ def test_cli_help(cli_call, capsys):
     captured = capsys.readouterr()
     assert captured.out.startswith('usage:')
 
+
 def test_cli_version(cli_call, capsys):
     """ Running nominatim tool --version prints a version string.
     """
@@ -46,7 +46,6 @@ class TestCliWithDb:
         # Make sure tools.freeze.is_frozen doesn't report database as frozen. Monkeypatching failed
         table_factory('place')
 
-
     @pytest.mark.parametrize("name,oid", [('file', 'foo.osm'), ('diff', 'foo.osc')])
     def test_cli_add_data_file_command(self, cli_call, mock_func_factory, name, oid):
         mock_run_legacy = mock_func_factory(nominatim_db.tools.add_osm_data, 'add_data_from_file')
@@ -54,7 +53,6 @@ class TestCliWithDb:
 
         assert mock_run_legacy.called == 1
 
-
     @pytest.mark.parametrize("name,oid", [('node', 12), ('way', 8), ('relation', 32)])
     def test_cli_add_data_object_command(self, cli_call, mock_func_factory, name, oid):
         mock_run_legacy = mock_func_factory(nominatim_db.tools.add_osm_data, 'add_osm_object')
@@ -62,8 +60,6 @@ class TestCliWithDb:
 
         assert mock_run_legacy.called == 1
 
-
-
     def test_cli_add_data_tiger_data(self, cli_call, cli_tokenizer_mock, async_mock_func_factory):
         mock = async_mock_func_factory(nominatim_db.tools.tiger_data, 'add_tiger_data')
 
@@ -80,7 +76,6 @@ class TestCliWithDb:
         assert mock_drop.called == 1
         assert mock_flatnode.called == 1
 
-
     @pytest.mark.parametrize("params,do_bnds,do_ranks", [
                               ([], 2, 2),
                               (['--boundaries-only'], 2, 0),
@@ -89,11 +84,14 @@ class TestCliWithDb:
     def test_index_command(self, monkeypatch, async_mock_func_factory, table_factory,
                            params, do_bnds, do_ranks):
         table_factory('import_status', 'indexed bool')
-        bnd_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer, 'index_boundaries')
-        rank_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer, 'index_by_rank')
-        postcode_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer, 'index_postcodes')
-
-        monkeypatch.setattr(nominatim_db.indexer.indexer.Indexer, 'has_pending', 
+        bnd_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer,
+                                           'index_boundaries')
+        rank_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer,
+                                            'index_by_rank')
+        postcode_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer,
+                                                'index_postcodes')
+
+        monkeypatch.setattr(nominatim_db.indexer.indexer.Indexer, 'has_pending',
                             [False, True].pop)
 
         assert self.call_nominatim('index', *params) == 0
@@ -102,7 +100,6 @@ class TestCliWithDb:
         assert rank_mock.called == do_ranks
         assert postcode_mock.called == do_ranks
 
-
     def test_special_phrases_wiki_command(self, mock_func_factory):
         func = mock_func_factory(nominatim_db.clicmd.special_phrases.SPImporter, 'import_phrases')
 
@@ -110,7 +107,6 @@ class TestCliWithDb:
 
         assert func.called == 1
 
-
     def test_special_phrases_csv_command(self, src_dir, mock_func_factory):
         func = mock_func_factory(nominatim_db.clicmd.special_phrases.SPImporter, 'import_phrases')
         testdata = src_dir / 'test' / 'testdb'
@@ -120,7 +116,6 @@ class TestCliWithDb:
 
         assert func.called == 1
 
-
     def test_special_phrases_csv_bad_file(self, src_dir):
         testdata = src_dir / 'something349053905.csv'
 
diff --git a/test/python/cli/test_cmd_admin.py b/test/python/cli/test_cmd_admin.py
index 7b0b9cd4..9732d734 100644
--- a/test/python/cli/test_cmd_admin.py
+++ b/test/python/cli/test_cmd_admin.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for the command line interface wrapper admin subcommand.
@@ -39,11 +39,13 @@ def test_admin_clean_deleted_relations(cli_call, mock_func_factory):
     assert cli_call('admin', '--clean-deleted', '1 month') == 0
     assert mock.called == 1
 
+
 def test_admin_clean_deleted_relations_no_age(cli_call, mock_func_factory):
-    mock = mock_func_factory(nominatim_db.tools.admin, 'clean_deleted_relations')
+    mock_func_factory(nominatim_db.tools.admin, 'clean_deleted_relations')
 
     assert cli_call('admin', '--clean-deleted') == 1
 
+
 class TestCliAdminWithDb:
 
     @pytest.fixture(autouse=True)
@@ -51,7 +53,6 @@ class TestCliAdminWithDb:
         self.call_nominatim = cli_call
         self.tokenizer_mock = cli_tokenizer_mock
 
-
     @pytest.mark.parametrize("func, params", [('analyse_indexing', ('--analyse-indexing', ))])
     def test_analyse_indexing(self, mock_func_factory, func, params):
         mock = mock_func_factory(nominatim_db.tools.admin, func)
diff --git a/test/python/cli/test_cmd_api.py b/test/python/cli/test_cmd_api.py
index 1c0750d1..541b680c 100644
--- a/test/python/cli/test_cmd_api.py
+++ b/test/python/cli/test_cmd_api.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for API access commands of command-line interface wrapper.
@@ -10,9 +10,9 @@ Tests for API access commands of command-line interface wrapper.
 import json
 import pytest
 
-import nominatim_db.clicmd.api
 import nominatim_api as napi
 
+
 @pytest.mark.parametrize('call', ['search', 'reverse', 'lookup', 'details', 'status'])
 def test_list_format(cli_call, call):
     assert 0 == cli_call(call, '--list-formats')
@@ -30,13 +30,11 @@ class TestCliStatusCall:
         monkeypatch.setattr(napi.NominatimAPI, 'status',
                             lambda self: napi.StatusResult(200, 'OK'))
 
-
     def test_status_simple(self, cli_call, tmp_path):
         result = cli_call('status', '--project-dir', str(tmp_path))
 
         assert result == 0
 
-
     def test_status_json_format(self, cli_call, tmp_path, capsys):
         result = cli_call('status', '--project-dir', str(tmp_path),
                           '--format', 'json')
@@ -60,7 +58,6 @@ class TestCliDetailsCall:
                                         ('--way', '1'),
                                         ('--relation', '1'),
                                         ('--place_id', '10001')])
-
     def test_details_json_format(self, cli_call, tmp_path, capsys, params):
         result = cli_call('details', '--project-dir', str(tmp_path), *params)
 
@@ -75,15 +72,14 @@ class TestCliReverseCall:
     def setup_reverse_mock(self, monkeypatch):
         result = napi.ReverseResult(napi.SourceTable.PLACEX, ('place', 'thing'),
                                     napi.Point(1.0, -3.0),
-                                    names={'name':'Name', 'name:fr': 'Nom'},
-                                    extratags={'extra':'Extra'},
+                                    names={'name': 'Name', 'name:fr': 'Nom'},
+                                    extratags={'extra': 'Extra'},
                                     locale_name='Name',
                                     display_name='Name')
 
         monkeypatch.setattr(napi.NominatimAPI, 'reverse',
                             lambda *args, **kwargs: result)
 
-
     def test_reverse_simple(self, cli_call, tmp_path, capsys):
         result = cli_call('reverse', '--project-dir', str(tmp_path),
                           '--lat', '34', '--lon', '34')
@@ -96,7 +92,6 @@ class TestCliReverseCall:
         assert 'extratags' not in out
         assert 'namedetails' not in out
 
-
     @pytest.mark.parametrize('param,field', [('--addressdetails', 'address'),
                                              ('--extratags', 'extratags'),
                                              ('--namedetails', 'namedetails')])
@@ -109,7 +104,6 @@ class TestCliReverseCall:
         out = json.loads(capsys.readouterr().out)
         assert field in out
 
-
     def test_reverse_format(self, cli_call, tmp_path, capsys):
         result = cli_call('reverse', '--project-dir', str(tmp_path),
                           '--lat', '34', '--lon', '34', '--format', 'geojson')
@@ -125,11 +119,11 @@ class TestCliLookupCall:
     @pytest.fixture(autouse=True)
     def setup_lookup_mock(self, monkeypatch):
         result = napi.SearchResult(napi.SourceTable.PLACEX, ('place', 'thing'),
-                                    napi.Point(1.0, -3.0),
-                                    names={'name':'Name', 'name:fr': 'Nom'},
-                                    extratags={'extra':'Extra'},
-                                    locale_name='Name',
-                                    display_name='Name')
+                                   napi.Point(1.0, -3.0),
+                                   names={'name': 'Name', 'name:fr': 'Nom'},
+                                   extratags={'extra': 'Extra'},
+                                   locale_name='Name',
+                                   display_name='Name')
 
         monkeypatch.setattr(napi.NominatimAPI, 'lookup',
                             lambda *args, **kwargs: napi.SearchResults([result]))
@@ -150,19 +144,18 @@ class TestCliLookupCall:
 
 @pytest.mark.parametrize('endpoint, params', [('search', ('--query', 'Berlin')),
                                               ('search_address', ('--city', 'Berlin'))
-                                             ])
+                                              ])
 def test_search(cli_call, tmp_path, capsys, monkeypatch, endpoint, params):
     result = napi.SearchResult(napi.SourceTable.PLACEX, ('place', 'thing'),
                                napi.Point(1.0, -3.0),
-                               names={'name':'Name', 'name:fr': 'Nom'},
-                               extratags={'extra':'Extra'},
+                               names={'name': 'Name', 'name:fr': 'Nom'},
+                               extratags={'extra': 'Extra'},
                                locale_name='Name',
                                display_name='Name')
 
     monkeypatch.setattr(napi.NominatimAPI, endpoint,
                         lambda *args, **kwargs: napi.SearchResults([result]))
 
-
     result = cli_call('search', '--project-dir', str(tmp_path), *params)
 
     assert result == 0
diff --git a/test/python/cli/test_cmd_import.py b/test/python/cli/test_cmd_import.py
index f833dde3..e4a86fe0 100644
--- a/test/python/cli/test_cmd_import.py
+++ b/test/python/cli/test_cmd_import.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for import command of the command-line interface wrapper.
@@ -24,15 +24,12 @@ class TestCliImportWithDb:
         self.call_nominatim = cli_call
         self.tokenizer_mock = cli_tokenizer_mock
 
-
     def test_import_missing_file(self):
         assert self.call_nominatim('import', '--osm-file', 'sfsafegwedgw.reh.erh') == 1
 
-
     def test_import_bad_file(self):
         assert self.call_nominatim('import', '--osm-file', '.') == 1
 
-
     @pytest.mark.parametrize('with_updates', [True, False])
     def test_import_full(self, mock_func_factory, async_mock_func_factory,
                          with_updates, place_table, property_table):
@@ -62,7 +59,6 @@ class TestCliImportWithDb:
 
         cf_mock = mock_func_factory(nominatim_db.tools.refresh, 'create_functions')
 
-
         assert self.call_nominatim(*params) == 0
         assert self.tokenizer_mock.finalize_import_called
 
@@ -71,7 +67,6 @@ class TestCliImportWithDb:
         for mock in mocks:
             assert mock.called == 1, "Mock '{}' not called".format(mock.func_name)
 
-
     def test_import_continue_load_data(self, mock_func_factory, async_mock_func_factory):
         mocks = [
             mock_func_factory(nominatim_db.tools.database_import, 'truncate_data_tables'),
@@ -89,7 +84,6 @@ class TestCliImportWithDb:
         for mock in mocks:
             assert mock.called == 1, "Mock '{}' not called".format(mock.func_name)
 
-
     def test_import_continue_indexing(self, mock_func_factory, async_mock_func_factory,
                                       placex_table, temp_db_conn):
         mocks = [
@@ -107,7 +101,6 @@ class TestCliImportWithDb:
         # Calling it again still works for the index
         assert self.call_nominatim('import', '--continue', 'indexing') == 0
 
-
     def test_import_continue_postprocess(self, mock_func_factory, async_mock_func_factory):
         mocks = [
             async_mock_func_factory(nominatim_db.tools.database_import, 'create_search_indices'),
diff --git a/test/python/cli/test_cmd_refresh.py b/test/python/cli/test_cmd_refresh.py
index 9f3d7bb2..8121946f 100644
--- a/test/python/cli/test_cmd_refresh.py
+++ b/test/python/cli/test_cmd_refresh.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for command line interface wrapper for refresk command.
@@ -13,6 +13,7 @@ import nominatim_db.tools.refresh
 import nominatim_db.tools.postcodes
 import nominatim_db.indexer.indexer
 
+
 class TestRefresh:
 
     @pytest.fixture(autouse=True)
@@ -20,7 +21,6 @@ class TestRefresh:
         self.call_nominatim = cli_call
         self.tokenizer_mock = cli_tokenizer_mock
 
-
     @pytest.mark.parametrize("command,func", [
                              ('address-levels', 'load_address_levels_from_config'),
                              ('wiki-data', 'import_wikipedia_articles'),
@@ -33,17 +33,14 @@ class TestRefresh:
         assert self.call_nominatim('refresh', '--' + command) == 0
         assert func_mock.called == 1
 
-
     def test_refresh_word_count(self):
         assert self.call_nominatim('refresh', '--word-count') == 0
         assert self.tokenizer_mock.update_statistics_called
 
-
     def test_refresh_word_tokens(self):
         assert self.call_nominatim('refresh', '--word-tokens') == 0
         assert self.tokenizer_mock.update_word_tokens_called
 
-
     def test_refresh_postcodes(self, async_mock_func_factory, mock_func_factory, place_table):
         func_mock = mock_func_factory(nominatim_db.tools.postcodes, 'update_postcodes')
         idx_mock = async_mock_func_factory(nominatim_db.indexer.indexer.Indexer, 'index_postcodes')
@@ -52,12 +49,10 @@ class TestRefresh:
         assert func_mock.called == 1
         assert idx_mock.called == 1
 
-
     def test_refresh_postcodes_no_place_table(self):
         # Do nothing without the place table
         assert self.call_nominatim('refresh', '--postcodes') == 0
 
-
     def test_refresh_create_functions(self, mock_func_factory):
         func_mock = mock_func_factory(nominatim_db.tools.refresh, 'create_functions')
 
@@ -65,17 +60,14 @@ class TestRefresh:
         assert func_mock.called == 1
         assert self.tokenizer_mock.update_sql_functions_called
 
-
     def test_refresh_wikidata_file_not_found(self, monkeypatch):
         monkeypatch.setenv('NOMINATIM_WIKIPEDIA_DATA_PATH', 'gjoiergjeroi345Q')
 
         assert self.call_nominatim('refresh', '--wiki-data') == 1
 
-
     def test_refresh_secondary_importance_file_not_found(self):
         assert self.call_nominatim('refresh', '--secondary-importance') == 1
 
-
     def test_refresh_secondary_importance_new_table(self, mock_func_factory):
         mocks = [mock_func_factory(nominatim_db.tools.refresh, 'import_secondary_importance'),
                  mock_func_factory(nominatim_db.tools.refresh, 'create_functions')]
@@ -84,7 +76,6 @@ class TestRefresh:
         assert mocks[0].called == 1
         assert mocks[1].called == 1
 
-
     def test_refresh_importance_computed_after_wiki_import(self, monkeypatch, mock_func_factory):
         calls = []
         monkeypatch.setattr(nominatim_db.tools.refresh, 'import_wikipedia_articles',
@@ -102,7 +93,8 @@ class TestRefresh:
                                         ('--data-object', 'N23', '--data-object', 'N24'),
                                         ('--data-area', 'R7723'),
                                         ('--data-area', 'r7723', '--data-area', 'r2'),
-                                        ('--data-area', 'R9284425', '--data-object', 'n1234567894567')])
+                                        ('--data-area', 'R9284425',
+                                         '--data-object', 'n1234567894567')])
     def test_refresh_objects(self, params, mock_func_factory):
         func_mock = mock_func_factory(nominatim_db.tools.refresh, 'invalidate_osm_object')
 
@@ -110,7 +102,6 @@ class TestRefresh:
 
         assert func_mock.called == len(params)/2
 
-
     @pytest.mark.parametrize('func', ('--data-object', '--data-area'))
     @pytest.mark.parametrize('param', ('234', 'a55', 'R 453', 'Rel'))
     def test_refresh_objects_bad_param(self, func, param, mock_func_factory):
diff --git a/test/python/cli/test_cmd_replication.py b/test/python/cli/test_cmd_replication.py
index 21c6350d..8ec17eaa 100644
--- a/test/python/cli/test_cmd_replication.py
+++ b/test/python/cli/test_cmd_replication.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2023 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for replication command of command-line interface wrapper.
@@ -18,6 +18,7 @@ import nominatim_db.tools.replication
 import nominatim_db.tools.refresh
 from nominatim_db.db import status
 
+
 @pytest.fixture
 def tokenizer_mock(monkeypatch):
     class DummyTokenizer:
@@ -40,7 +41,6 @@ def tokenizer_mock(monkeypatch):
     return tok
 
 
-
 @pytest.fixture
 def init_status(temp_db_conn, status_table):
     status.set_status(temp_db_conn, date=dt.datetime.now(dt.timezone.utc), seq=1)
@@ -62,16 +62,14 @@ class TestCliReplication:
     def setup_cli_call(self, cli_call, temp_db):
         self.call_nominatim = lambda *args: cli_call('replication', *args)
 
-
     @pytest.fixture(autouse=True)
     def setup_update_function(self, monkeypatch):
         def _mock_updates(states):
             monkeypatch.setattr(nominatim_db.tools.replication, 'update',
-                            lambda *args, **kwargs: states.pop())
+                                lambda *args, **kwargs: states.pop())
 
         self.update_states = _mock_updates
 
-
     @pytest.mark.parametrize("params,func", [
                              (('--init',), 'init_replication'),
                              (('--init', '--no-update-functions'), 'init_replication'),
@@ -88,36 +86,32 @@ class TestCliReplication:
         if params == ('--init',):
             assert umock.called == 1
 
-
     def test_replication_update_bad_interval(self, monkeypatch):
         monkeypatch.setenv('NOMINATIM_REPLICATION_UPDATE_INTERVAL', 'xx')
 
         assert self.call_nominatim() == 1
 
-
     def test_replication_update_bad_interval_for_geofabrik(self, monkeypatch):
         monkeypatch.setenv('NOMINATIM_REPLICATION_URL',
                            'https://download.geofabrik.de/europe/italy-updates')
 
         assert self.call_nominatim() == 1
 
-
     def test_replication_update_continuous_no_index(self):
         assert self.call_nominatim('--no-index') == 1
 
-    def test_replication_update_once_no_index(self, update_mock):
+    def test_replication_update_once_no_index(self, update_mock, monkeypatch):
+        monkeypatch.setenv('NOMINATIM_OSM2PGSQL_BINARY', 'OSM2PGSQL NOT AVAILABLE')
         assert self.call_nominatim('--once', '--no-index') == 0
 
         assert str(update_mock.last_args[1]['osm2pgsql']).endswith('OSM2PGSQL NOT AVAILABLE')
 
-
     def test_replication_update_custom_osm2pgsql(self, monkeypatch, update_mock):
         monkeypatch.setenv('NOMINATIM_OSM2PGSQL_BINARY', '/secret/osm2pgsql')
         assert self.call_nominatim('--once', '--no-index') == 0
 
         assert str(update_mock.last_args[1]['osm2pgsql']) == '/secret/osm2pgsql'
 
-
     @pytest.mark.parametrize("update_interval", [60, 3600])
     def test_replication_catchup(self, placex_table, monkeypatch, index_mock, update_interval):
         monkeypatch.setenv('NOMINATIM_REPLICATION_UPDATE_INTERVAL', str(update_interval))
@@ -125,13 +119,11 @@ class TestCliReplication:
 
         assert self.call_nominatim('--catch-up') == 0
 
-
     def test_replication_update_custom_threads(self, update_mock):
         assert self.call_nominatim('--once', '--no-index', '--threads', '4') == 0
 
         assert update_mock.last_args[1]['threads'] == 4
 
-
     def test_replication_update_continuous(self, index_mock):
         self.update_states([nominatim_db.tools.replication.UpdateState.UP_TO_DATE,
                             nominatim_db.tools.replication.UpdateState.UP_TO_DATE])
@@ -141,7 +133,6 @@ class TestCliReplication:
 
         assert index_mock.called == 2
 
-
     def test_replication_update_continuous_no_change(self, mock_func_factory,
                                                      index_mock):
         self.update_states([nominatim_db.tools.replication.UpdateState.NO_CHANGES,
diff --git a/test/python/config/test_config.py b/test/python/config/test_config.py
index 8f90b5da..a0dbf476 100644
--- a/test/python/config/test_config.py
+++ b/test/python/config/test_config.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for loading dotenv configuration.
@@ -13,6 +13,7 @@ import pytest
 from nominatim_db.config import Configuration, flatten_config_list
 from nominatim_db.errors import UsageError
 
+
 @pytest.fixture
 def make_config():
     """ Create a configuration object from the given project directory.
@@ -22,6 +23,7 @@ def make_config():
 
     return _mk_config
 
+
 @pytest.fixture
 def make_config_path(tmp_path):
     """ Create a configuration object with project and config directories
@@ -108,7 +110,7 @@ def test_get_libpq_dsn_convert_php(make_config, monkeypatch):
 
 @pytest.mark.parametrize("val,expect", [('foo bar', "'foo bar'"),
                                         ("xy'z", "xy\\'z"),
-                                       ])
+                                        ])
 def test_get_libpq_dsn_convert_php_special_chars(make_config, monkeypatch, val, expect):
     config = make_config()
 
@@ -137,6 +139,7 @@ def test_get_bool(make_config, monkeypatch, value, result):
 
     assert config.get_bool('FOOBAR') == result
 
+
 def test_get_bool_empty(make_config):
     config = make_config()
 
@@ -222,7 +225,7 @@ def test_get_import_style_intern(make_config, src_dir, monkeypatch):
 
     monkeypatch.setenv('NOMINATIM_IMPORT_STYLE', 'street')
 
-    expected = src_dir / 'settings' / 'import-street.lua'
+    expected = src_dir / 'lib-lua' / 'import-street.lua'
 
     assert config.get_import_style_file() == expected
 
@@ -303,7 +306,7 @@ def test_load_subconf_env_absolute_not_found(make_config_path, monkeypatch, tmp_
     (config.config_dir / 'test.yaml').write_text('cow: muh\ncat: miau\n')
 
     with pytest.raises(UsageError, match='Config file not found.'):
-        rules = config.load_sub_configuration('test.yaml', config='MY_CONFIG')
+        config.load_sub_configuration('test.yaml', config='MY_CONFIG')
 
 
 @pytest.mark.parametrize("location", ['project_dir', 'config_dir'])
@@ -326,7 +329,7 @@ def test_load_subconf_env_relative_not_found(make_config_path, monkeypatch):
     (config.config_dir / 'test.yaml').write_text('cow: muh\ncat: miau\n')
 
     with pytest.raises(UsageError, match='Config file not found.'):
-        rules = config.load_sub_configuration('test.yaml', config='MY_CONFIG')
+        config.load_sub_configuration('test.yaml', config='MY_CONFIG')
 
 
 def test_load_subconf_json(make_config_path):
@@ -338,6 +341,7 @@ def test_load_subconf_json(make_config_path):
 
     assert rules == dict(cow='muh', cat='miau')
 
+
 def test_load_subconf_not_found(make_config_path):
     config = make_config_path()
 
@@ -371,7 +375,7 @@ def test_load_subconf_include_relative(make_config_path, tmp_path, location):
     config = make_config_path()
 
     testfile = config.config_dir / 'test.yaml'
-    testfile.write_text(f'base: !include inc.yaml\n')
+    testfile.write_text('base: !include inc.yaml\n')
     (getattr(config, location) / 'inc.yaml').write_text('first: 1\nsecond: 2\n')
 
     rules = config.load_sub_configuration('test.yaml')
@@ -383,28 +387,28 @@ def test_load_subconf_include_bad_format(make_config_path):
     config = make_config_path()
 
     testfile = config.config_dir / 'test.yaml'
-    testfile.write_text(f'base: !include inc.txt\n')
+    testfile.write_text('base: !include inc.txt\n')
     (config.config_dir / 'inc.txt').write_text('first: 1\nsecond: 2\n')
 
     with pytest.raises(UsageError, match='Cannot handle config file format.'):
-        rules = config.load_sub_configuration('test.yaml')
+        config.load_sub_configuration('test.yaml')
 
 
 def test_load_subconf_include_not_found(make_config_path):
     config = make_config_path()
 
     testfile = config.config_dir / 'test.yaml'
-    testfile.write_text(f'base: !include inc.txt\n')
+    testfile.write_text('base: !include inc.txt\n')
 
     with pytest.raises(UsageError, match='Config file not found.'):
-        rules = config.load_sub_configuration('test.yaml')
+        config.load_sub_configuration('test.yaml')
 
 
 def test_load_subconf_include_recursive(make_config_path):
     config = make_config_path()
 
     testfile = config.config_dir / 'test.yaml'
-    testfile.write_text(f'base: !include inc.yaml\n')
+    testfile.write_text('base: !include inc.yaml\n')
     (config.config_dir / 'inc.yaml').write_text('- !include more.yaml\n- upper\n')
     (config.config_dir / 'more.yaml').write_text('- the end\n')
 
@@ -435,6 +439,6 @@ def test_flatten_config_list_nested():
         [[2, 3], [45, [56, 78], 66]],
         'end'
     ]
+
     assert flatten_config_list(content) == \
-               [34, {'first': '1st', 'second': '2nd'}, {},
-                2, 3, 45, 56, 78, 66, 'end']
+        [34, {'first': '1st', 'second': '2nd'}, {}, 2, 3, 45, 56, 78, 66, 'end']
diff --git a/test/python/config/test_config_load_module.py b/test/python/config/test_config_load_module.py
index c2912180..309bd1fc 100644
--- a/test/python/config/test_config_load_module.py
+++ b/test/python/config/test_config_load_module.py
@@ -2,18 +2,18 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for loading extra Python modules.
 """
-from pathlib import Path
 import sys
 
 import pytest
 
 from nominatim_db.config import Configuration
 
+
 @pytest.fixture
 def test_config(src_dir, tmp_path):
     """ Create a configuration object with project and config directories
@@ -31,6 +31,7 @@ def test_load_default_module(test_config):
 
     assert isinstance(module.NOMINATIM_VERSION, tuple)
 
+
 def test_load_default_module_with_hyphen(test_config):
     module = test_config.load_plugin_module('place-info', 'nominatim_db.data')
 
diff --git a/test/python/conftest.py b/test/python/conftest.py
index a25ff8ec..046ee5a6 100644
--- a/test/python/conftest.py
+++ b/test/python/conftest.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 import itertools
 import sys
@@ -69,6 +69,7 @@ def temp_db_with_extensions(temp_db):
 
     return temp_db
 
+
 @pytest.fixture
 def temp_db_conn(temp_db):
     """ Connection to the test database.
@@ -100,8 +101,9 @@ def table_factory(temp_db_conn):
             if content:
                 sql = pysql.SQL("INSERT INTO {} VALUES ({})")\
                            .format(pysql.Identifier(name),
-                                   pysql.SQL(',').join([pysql.Placeholder() for _ in range(len(content[0]))]))
-                cur.executemany(sql , content)
+                                   pysql.SQL(',').join([pysql.Placeholder()
+                                                        for _ in range(len(content[0]))]))
+                cur.executemany(sql, content)
 
     return mk_table
 
@@ -109,7 +111,6 @@ def table_factory(temp_db_conn):
 @pytest.fixture
 def def_config():
     cfg = Configuration(None)
-    cfg.set_libdirs(osm2pgsql=None)
     return cfg
 
 
@@ -118,7 +119,6 @@ def project_env(tmp_path):
     projdir = tmp_path / 'project'
     projdir.mkdir()
     cfg = Configuration(projdir)
-    cfg.set_libdirs(osm2pgsql=None)
     return cfg
 
 
@@ -178,6 +178,7 @@ def place_row(place_table, temp_db_cursor):
 
     return _insert
 
+
 @pytest.fixture
 def placex_table(temp_db_with_extensions, temp_db_conn):
     """ Create an empty version of the place table.
@@ -208,7 +209,7 @@ def osmline_table(temp_db_with_extensions, table_factory):
 def sql_preprocessor_cfg(tmp_path, table_factory, temp_db_with_extensions):
     table_factory('country_name', 'partition INT', ((0, ), (1, ), (2, )))
     cfg = Configuration(None)
-    cfg.set_libdirs(osm2pgsql=None, sql=tmp_path)
+    cfg.set_libdirs(sql=tmp_path)
     return cfg
 
 
@@ -233,6 +234,6 @@ def tokenizer_mock(monkeypatch, property_table):
     property_table.set('tokenizer', 'dummy')
 
     def _create_tokenizer():
-        return dummy_tokenizer.DummyTokenizer(None, None)
+        return dummy_tokenizer.DummyTokenizer(None)
 
     return _create_tokenizer
diff --git a/test/python/cursor.py b/test/python/cursor.py
index b3fc260a..5dc93cd5 100644
--- a/test/python/cursor.py
+++ b/test/python/cursor.py
@@ -2,13 +2,14 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Specialised psycopg cursor with shortcut functions useful for testing.
 """
 import psycopg
 
+
 class CursorForTesting(psycopg.Cursor):
     """ Extension to the DictCursor class that provides execution
         short-cuts that simplify writing assertions.
@@ -22,7 +23,6 @@ class CursorForTesting(psycopg.Cursor):
         assert self.rowcount == 1
         return self.fetchone()[0]
 
-
     def row_set(self, sql, params=None):
         """ Execute a query and return the result as a set of tuples.
             Fails when the SQL command returns duplicate rows.
@@ -34,7 +34,6 @@ class CursorForTesting(psycopg.Cursor):
 
         return result
 
-
     def table_exists(self, table):
         """ Check that a table with the given name exists in the database.
         """
@@ -42,7 +41,6 @@ class CursorForTesting(psycopg.Cursor):
                              WHERE tablename = %s""", (table, ))
         return num == 1
 
-
     def index_exists(self, table, index):
         """ Check that an indexwith the given name exists on the given table.
         """
@@ -51,7 +49,6 @@ class CursorForTesting(psycopg.Cursor):
                           (table, index))
         return num == 1
 
-
     def table_rows(self, table, where=None):
         """ Return the number of rows in the given table.
         """
diff --git a/test/python/data/test_country_info.py b/test/python/data/test_country_info.py
index 14b306bb..a85b7bf9 100644
--- a/test/python/data/test_country_info.py
+++ b/test/python/data/test_country_info.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for function that handle country properties.
@@ -12,6 +12,7 @@ import pytest
 
 from nominatim_db.data import country_info
 
+
 @pytest.fixture
 def loaded_country(def_config):
     country_info.setup_country_config(def_config)
@@ -115,8 +116,8 @@ def test_setup_country_config_languages_not_loaded(env_with_country_config):
     info = country_info._CountryInfo()
     info.load(config)
     assert dict(info.items()) == {'de': {'partition': 3,
-                                  'languages': [],
-                                  'names': {'name': 'Deutschland'}}}
+                                         'languages': [],
+                                         'names': {'name': 'Deutschland'}}}
 
 
 def test_setup_country_config_name_not_loaded(env_with_country_config):
@@ -132,8 +133,7 @@ def test_setup_country_config_name_not_loaded(env_with_country_config):
 
     assert dict(info.items()) == {'de': {'partition': 3,
                                          'languages': ['de'],
-                                         'names': {}
-                                 }}
+                                         'names': {}}}
 
 
 def test_setup_country_config_names_not_loaded(env_with_country_config):
@@ -148,8 +148,7 @@ def test_setup_country_config_names_not_loaded(env_with_country_config):
 
     assert dict(info.items()) == {'de': {'partition': 3,
                                          'languages': ['de'],
-                                         'names': {}
-                                 }}
+                                         'names': {}}}
 
 
 def test_setup_country_config_special_character(env_with_country_config):
@@ -157,8 +156,8 @@ def test_setup_country_config_special_character(env_with_country_config):
                                      bq:
                                          partition: 250
                                          languages: nl
-                                         names: 
-                                             name: 
+                                         names:
+                                             name:
                                                  default: "\\N"
                                      """)
 
@@ -167,5 +166,4 @@ def test_setup_country_config_special_character(env_with_country_config):
 
     assert dict(info.items()) == {'bq': {'partition': 250,
                                          'languages': ['nl'],
-                                         'names': {'name': '\x85'}
-                                 }}
+                                         'names': {'name': '\x85'}}}
diff --git a/test/python/db/test_connection.py b/test/python/db/test_connection.py
index a8b5d677..19b945fd 100644
--- a/test/python/db/test_connection.py
+++ b/test/python/db/test_connection.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for specialised connection and cursor classes.
@@ -12,6 +12,7 @@ import psycopg
 
 import nominatim_db.db.connection as nc
 
+
 @pytest.fixture
 def db(dsn):
     with nc.connect(dsn) as conn:
@@ -36,6 +37,7 @@ def test_has_column(db, table_factory, name, result):
 
     assert nc.table_has_column(db, 'stuff', name) == result
 
+
 def test_connection_index_exists(db, table_factory, temp_db_cursor):
     assert not nc.index_exists(db, 'some_index')
 
@@ -76,6 +78,7 @@ def test_drop_table_non_existing_force(db):
     with pytest.raises(psycopg.ProgrammingError, match='.*does not exist.*'):
         nc.drop_tables(db, 'dfkjgjriogjigjgjrdghehtre', if_exists=False)
 
+
 def test_connection_server_version_tuple(db):
     ver = nc.server_version_tuple(db)
 
diff --git a/test/python/db/test_properties.py b/test/python/db/test_properties.py
index e55bb973..84d7dae0 100644
--- a/test/python/db/test_properties.py
+++ b/test/python/db/test_properties.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for property table manpulation.
@@ -11,6 +11,7 @@ import pytest
 
 from nominatim_db.db import properties
 
+
 @pytest.fixture
 def property_factory(property_table, temp_db_cursor):
     """ A function fixture that adds a property into the property table.
diff --git a/test/python/db/test_sql_preprocessor.py b/test/python/db/test_sql_preprocessor.py
index 45109c70..f2fbbb2a 100644
--- a/test/python/db/test_sql_preprocessor.py
+++ b/test/python/db/test_sql_preprocessor.py
@@ -2,16 +2,17 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for SQL preprocessing.
 """
 import pytest
-import pytest_asyncio
+import pytest_asyncio  # noqa
 
 from nominatim_db.db.sql_preprocessor import SQLPreprocessor
 
+
 @pytest.fixture
 def sql_factory(tmp_path):
     def _mk_sql(sql_body):
@@ -26,6 +27,7 @@ def sql_factory(tmp_path):
 
     return _mk_sql
 
+
 @pytest.mark.parametrize("expr,ret", [
     ("'a'", 'a'),
     ("'{{db.partitions|join}}'", '012'),
@@ -61,8 +63,7 @@ def test_load_file_with_params(sql_preprocessor, sql_factory, temp_db_conn, temp
 async def test_load_parallel_file(dsn, sql_preprocessor, tmp_path, temp_db_cursor):
     (tmp_path / 'test.sql').write_text("""
         CREATE TABLE foo (a TEXT);
-        CREATE TABLE foo2(a TEXT);""" + 
-        "\n---\nCREATE TABLE bar (b INT);")
+        CREATE TABLE foo2(a TEXT);""" + "\n---\nCREATE TABLE bar (b INT);")
 
     await sql_preprocessor.run_parallel_sql_file(dsn, 'test.sql', num_threads=4)
 
diff --git a/test/python/db/test_status.py b/test/python/db/test_status.py
index 77135a8c..462b8e3d 100644
--- a/test/python/db/test_status.py
+++ b/test/python/db/test_status.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for status table manipulation.
@@ -19,7 +19,8 @@ OSM_NODE_DATA = """\
 <node id="45673" visible="true" version="1" changeset="2047" timestamp="2006-01-27T22:09:10Z" user="Foo" uid="111" lat="48.7586670" lon="8.1343060">
 </node>
 </osm>
-"""
+"""  # noqa
+
 
 def iso_date(date):
     return dt.datetime.strptime(date, nominatim_db.db.status.ISODATE_FORMAT)\
@@ -43,7 +44,8 @@ def test_compute_database_date_from_osm2pgsql(table_factory, temp_db_conn, offli
 def test_compute_database_date_from_osm2pgsql_nodata(table_factory, temp_db_conn):
     table_factory('osm2pgsql_properties', 'property TEXT, value TEXT')
 
-    with pytest.raises(UsageError, match='Cannot determine database date from data in offline mode'):
+    with pytest.raises(UsageError,
+                       match='Cannot determine database date from data in offline mode'):
         nominatim_db.db.status.compute_database_date(temp_db_conn, offline=True)
 
 
@@ -56,6 +58,7 @@ def test_compute_database_date_valid(monkeypatch, place_row, temp_db_conn):
     place_row(osm_type='N', osm_id=45673)
 
     requested_url = []
+
     def mock_url(url):
         requested_url.append(url)
         return OSM_NODE_DATA
@@ -72,6 +75,7 @@ def test_compute_database_broken_api(monkeypatch, place_row, temp_db_conn):
     place_row(osm_type='N', osm_id=45673)
 
     requested_url = []
+
     def mock_url(url):
         requested_url.append(url)
         return '<osm version="0.6" generator="OpenStre'
@@ -86,8 +90,7 @@ def test_set_status_empty_table(temp_db_conn, temp_db_cursor):
     date = dt.datetime.fromordinal(1000000).replace(tzinfo=dt.timezone.utc)
     nominatim_db.db.status.set_status(temp_db_conn, date=date)
 
-    assert temp_db_cursor.row_set("SELECT * FROM import_status") == \
-             {(date, None, True)}
+    assert temp_db_cursor.row_set("SELECT * FROM import_status") == {(date, None, True)}
 
 
 def test_set_status_filled_table(temp_db_conn, temp_db_cursor):
@@ -99,8 +102,7 @@ def test_set_status_filled_table(temp_db_conn, temp_db_cursor):
     date = dt.datetime.fromordinal(1000100).replace(tzinfo=dt.timezone.utc)
     nominatim_db.db.status.set_status(temp_db_conn, date=date, seq=456, indexed=False)
 
-    assert temp_db_cursor.row_set("SELECT * FROM import_status") == \
-             {(date, 456, False)}
+    assert temp_db_cursor.row_set("SELECT * FROM import_status") == {(date, 456, False)}
 
 
 def test_set_status_missing_date(temp_db_conn, temp_db_cursor):
@@ -111,8 +113,7 @@ def test_set_status_missing_date(temp_db_conn, temp_db_cursor):
 
     nominatim_db.db.status.set_status(temp_db_conn, date=None, seq=456, indexed=False)
 
-    assert temp_db_cursor.row_set("SELECT * FROM import_status") == \
-             {(date, 456, False)}
+    assert temp_db_cursor.row_set("SELECT * FROM import_status") == {(date, 456, False)}
 
 
 def test_get_status_empty_table(temp_db_conn):
@@ -123,8 +124,7 @@ def test_get_status_success(temp_db_conn):
     date = dt.datetime.fromordinal(1000000).replace(tzinfo=dt.timezone.utc)
     nominatim_db.db.status.set_status(temp_db_conn, date=date, seq=667, indexed=False)
 
-    assert nominatim_db.db.status.get_status(temp_db_conn) == \
-             (date, 667, False)
+    assert nominatim_db.db.status.get_status(temp_db_conn) == (date, 667, False)
 
 
 @pytest.mark.parametrize("old_state", [True, False])
diff --git a/test/python/db/test_utils.py b/test/python/db/test_utils.py
index 7c46846d..2bc7d959 100644
--- a/test/python/db/test_utils.py
+++ b/test/python/db/test_utils.py
@@ -2,18 +2,17 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for DB utility functions in db.utils
 """
-import json
-
 import pytest
 
 import nominatim_db.db.utils as db_utils
 from nominatim_db.errors import UsageError
 
+
 def test_execute_file_success(dsn, temp_db_cursor, tmp_path):
     tmpfile = tmp_path / 'test.sql'
     tmpfile.write_text('CREATE TABLE test (id INT);\nINSERT INTO test VALUES(56);')
@@ -22,6 +21,7 @@ def test_execute_file_success(dsn, temp_db_cursor, tmp_path):
 
     assert temp_db_cursor.row_set('SELECT * FROM test') == {(56, )}
 
+
 def test_execute_file_bad_file(dsn, tmp_path):
     with pytest.raises(FileNotFoundError):
         db_utils.execute_file(dsn, tmp_path / 'test2.sql')
diff --git a/test/python/dummy_tokenizer.py b/test/python/dummy_tokenizer.py
index 4739e3f0..ce74004a 100644
--- a/test/python/dummy_tokenizer.py
+++ b/test/python/dummy_tokenizer.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tokenizer for testing.
@@ -10,36 +10,33 @@ Tokenizer for testing.
 from nominatim_db.data.place_info import PlaceInfo
 from nominatim_db.config import Configuration
 
-def create(dsn, data_dir):
+
+def create(dsn):
     """ Create a new instance of the tokenizer provided by this module.
     """
-    return DummyTokenizer(dsn, data_dir)
+    return DummyTokenizer(dsn)
+
 
 class DummyTokenizer:
 
-    def __init__(self, dsn, data_dir):
+    def __init__(self, dsn):
         self.dsn = dsn
-        self.data_dir = data_dir
         self.init_state = None
         self.analyser_cache = {}
 
-
     def init_new_db(self, *args, **kwargs):
         assert self.init_state is None
         self.init_state = "new"
 
-
     def init_from_project(self, config):
         assert isinstance(config, Configuration)
         assert self.init_state is None
         self.init_state = "loaded"
 
-
     @staticmethod
     def finalize_import(_):
         pass
 
-
     def name_analyzer(self):
         return DummyNameAnalyzer(self.analyser_cache)
 
@@ -52,12 +49,10 @@ class DummyNameAnalyzer:
     def __exit__(self, exc_type, exc_value, traceback):
         self.close()
 
-
     def __init__(self, cache):
         self.analyser_cache = cache
         cache['countries'] = []
 
-
     def close(self):
         pass
 
diff --git a/test/python/indexer/test_indexing.py b/test/python/indexer/test_indexing.py
index fe65b69c..79b76c60 100644
--- a/test/python/indexer/test_indexing.py
+++ b/test/python/indexer/test_indexing.py
@@ -2,18 +2,19 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for running the indexing.
 """
 import itertools
 import pytest
-import pytest_asyncio
+import pytest_asyncio  # noqa
 
 from nominatim_db.indexer import indexer
 from nominatim_db.tokenizer import factory
 
+
 class IndexerTestDB:
 
     def __init__(self, conn):
@@ -232,6 +233,7 @@ async def test_index_partial_with_30(test_db, threads, test_tokenizer):
                     SELECT count(*) FROM placex
                       WHERE indexed_status = 0 AND rank_address between 1 and 27""") == 0
 
+
 @pytest.mark.parametrize("threads", [1, 15])
 @pytest.mark.asyncio
 async def test_index_boundaries(test_db, threads, test_tokenizer):
diff --git a/test/python/mock_icu_word_table.py b/test/python/mock_icu_word_table.py
index e8b4390f..b26025a0 100644
--- a/test/python/mock_icu_word_table.py
+++ b/test/python/mock_icu_word_table.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Legacy word table for testing with functions to prefil and test contents
@@ -10,6 +10,7 @@ of the table.
 """
 from nominatim_db.db.connection import execute_scalar
 
+
 class MockIcuWordTable:
     """ A word table for testing using legacy word table structure.
     """
@@ -31,7 +32,6 @@ class MockIcuWordTable:
                         (word_id, word or word_token, word))
         self.conn.commit()
 
-
     def add_special(self, word_token, word, cls, typ, oper):
         with self.conn.cursor() as cur:
             cur.execute("""INSERT INTO word (word_token, type, word, info)
@@ -42,7 +42,6 @@ class MockIcuWordTable:
                         """, (word_token, word, cls, typ, oper))
         self.conn.commit()
 
-
     def add_country(self, country_code, word_token):
         with self.conn.cursor() as cur:
             cur.execute("""INSERT INTO word (word_token, type, word)
@@ -50,7 +49,6 @@ class MockIcuWordTable:
                         (word_token, country_code))
         self.conn.commit()
 
-
     def add_postcode(self, word_token, postcode):
         with self.conn.cursor() as cur:
             cur.execute("""INSERT INTO word (word_token, type, word)
@@ -58,7 +56,6 @@ class MockIcuWordTable:
                         """, (word_token, postcode))
         self.conn.commit()
 
-
     def add_housenumber(self, word_id, word_tokens, word=None):
         with self.conn.cursor() as cur:
             if isinstance(word_tokens, str):
@@ -71,24 +68,21 @@ class MockIcuWordTable:
                     word = word_tokens[0]
                 for token in word_tokens:
                     cur.execute("""INSERT INTO word (word_id, word_token, type, word, info)
-                                      VALUES (%s, %s, 'H', %s, jsonb_build_object('lookup', %s::text))
+                                      VALUES (%s, %s, 'H', %s,
+                                              jsonb_build_object('lookup', %s::text))
                                 """, (word_id, token, word, word_tokens[0]))
 
         self.conn.commit()
 
-
     def count(self):
         return execute_scalar(self.conn, "SELECT count(*) FROM word")
 
-
     def count_special(self):
         return execute_scalar(self.conn, "SELECT count(*) FROM word WHERE type = 'S'")
 
-
     def count_housenumbers(self):
         return execute_scalar(self.conn, "SELECT count(*) FROM word WHERE type = 'H'")
 
-
     def get_special(self):
         with self.conn.cursor() as cur:
             cur.execute("SELECT word_token, info, word FROM word WHERE type = 'S'")
@@ -97,7 +91,6 @@ class MockIcuWordTable:
             assert len(result) == cur.rowcount, "Word table has duplicates."
             return result
 
-
     def get_country(self):
         with self.conn.cursor() as cur:
             cur.execute("SELECT word, word_token FROM word WHERE type = 'C'")
@@ -105,15 +98,12 @@ class MockIcuWordTable:
             assert len(result) == cur.rowcount, "Word table has duplicates."
             return result
 
-
     def get_postcodes(self):
         with self.conn.cursor() as cur:
             cur.execute("SELECT word FROM word WHERE type = 'P'")
             return set((row[0] for row in cur))
 
-
     def get_partial_words(self):
         with self.conn.cursor() as cur:
             cur.execute("SELECT word_token, info FROM word WHERE type ='w'")
             return set(((row[0], row[1]['count']) for row in cur))
-
diff --git a/test/python/mocks.py b/test/python/mocks.py
index cde0b7bb..fb7f4fa1 100644
--- a/test/python/mocks.py
+++ b/test/python/mocks.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Custom mocks for testing.
@@ -11,8 +11,6 @@ import itertools
 
 from nominatim_db.db import properties
 
-# This must always point to the mock word table for the default tokenizer.
-from mock_icu_word_table import MockIcuWordTable as MockWordTable
 
 class MockPlacexTable:
     """ A placex table for testing.
@@ -58,7 +56,8 @@ class MockPlacexTable:
                                                type, name, admin_level, address,
                                                housenumber, rank_search,
                                                extratags, geometry, country_code)
-                            VALUES(nextval('seq_place'), %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s)""",
+                            VALUES(nextval('seq_place'), %s, %s, %s, %s, %s, %s,
+                                   %s, %s, %s, %s, %s, %s)""",
                         (osm_type, osm_id or next(self.idseq), cls, typ, names,
                          admin_level, address, housenumber, rank_search,
                          extratags, 'SRID=4326;' + geom,
@@ -72,13 +71,11 @@ class MockPropertyTable:
     def __init__(self, conn):
         self.conn = conn
 
-
     def set(self, name, value):
         """ Set a property in the table to the given value.
         """
         properties.set_property(self.conn, name, value)
 
-
     def get(self, name):
         """ Set a property in the table to the given value.
         """
diff --git a/test/python/pytest.ini b/test/python/pytest.ini
index 15441de9..02fe3a86 100644
--- a/test/python/pytest.ini
+++ b/test/python/pytest.ini
@@ -1,3 +1,4 @@
 [pytest]
 markers =
-    sanitizer_params
\ No newline at end of file
+    sanitizer_params
+asyncio_default_fixture_loop_scope = function
diff --git a/test/python/tokenizer/sanitizers/test_clean_housenumbers.py b/test/python/tokenizer/sanitizers/test_clean_housenumbers.py
index 01fb162b..2dd10c56 100644
--- a/test/python/tokenizer/sanitizers/test_clean_housenumbers.py
+++ b/test/python/tokenizer/sanitizers/test_clean_housenumbers.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that normalizes housenumbers.
@@ -12,11 +12,12 @@ import pytest
 from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 from nominatim_db.data.place_info import PlaceInfo
 
+
 @pytest.fixture
 def sanitize(request, def_config):
     sanitizer_args = {'step': 'clean-housenumbers'}
     for mark in request.node.iter_markers(name="sanitizer_params"):
-        sanitizer_args.update({k.replace('_', '-') : v for k,v in mark.kwargs.items()})
+        sanitizer_args.update({k.replace('_', '-'): v for k, v in mark.kwargs.items()})
 
     def _run(**kwargs):
         place = PlaceInfo({'address': kwargs})
diff --git a/test/python/tokenizer/sanitizers/test_clean_postcodes.py b/test/python/tokenizer/sanitizers/test_clean_postcodes.py
index 70cc5256..242e9301 100644
--- a/test/python/tokenizer/sanitizers/test_clean_postcodes.py
+++ b/test/python/tokenizer/sanitizers/test_clean_postcodes.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that normalizes postcodes.
@@ -13,12 +13,13 @@ from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 from nominatim_db.data.place_info import PlaceInfo
 from nominatim_db.data import country_info
 
+
 @pytest.fixture
 def sanitize(def_config, request):
     country_info.setup_country_config(def_config)
     sanitizer_args = {'step': 'clean-postcodes'}
     for mark in request.node.iter_markers(name="sanitizer_params"):
-        sanitizer_args.update({k.replace('_', '-') : v for k,v in mark.kwargs.items()})
+        sanitizer_args.update({k.replace('_', '-'): v for k, v in mark.kwargs.items()})
 
     def _run(country=None, **kwargs):
         pi = {'address': kwargs}
diff --git a/test/python/tokenizer/sanitizers/test_clean_tiger_tags.py b/test/python/tokenizer/sanitizers/test_clean_tiger_tags.py
index 4badb57f..d245f4df 100644
--- a/test/python/tokenizer/sanitizers/test_clean_tiger_tags.py
+++ b/test/python/tokenizer/sanitizers/test_clean_tiger_tags.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for sanitizer that clean up TIGER tags.
@@ -12,16 +12,17 @@ import pytest
 from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 from nominatim_db.data.place_info import PlaceInfo
 
+
 class TestCleanTigerTags:
 
     @pytest.fixture(autouse=True)
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, addr):
         place = PlaceInfo({'address': addr})
-        _, outaddr = PlaceSanitizer([{'step': 'clean-tiger-tags'}], self.config).process_names(place)
+        _, outaddr = PlaceSanitizer([{'step': 'clean-tiger-tags'}],
+                                    self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix) for p in outaddr])
 
@@ -31,13 +32,11 @@ class TestCleanTigerTags:
         assert self.run_sanitizer_on({'tiger:county': inname})\
             == [(outname, 'county', 'tiger')]
 
-
     @pytest.mark.parametrize('name', ('Hamilton', 'Big, Road', ''))
     def test_badly_formatted(self, name):
         assert self.run_sanitizer_on({'tiger:county': name})\
             == [(name, 'county', 'tiger')]
 
-
     def test_unmatched(self):
         assert self.run_sanitizer_on({'tiger:country': 'US'})\
             == [('US', 'tiger', 'country')]
diff --git a/test/python/tokenizer/sanitizers/test_delete_tags.py b/test/python/tokenizer/sanitizers/test_delete_tags.py
index f9688c0b..9c8f2a90 100644
--- a/test/python/tokenizer/sanitizers/test_delete_tags.py
+++ b/test/python/tokenizer/sanitizers/test_delete_tags.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that normalizes housenumbers.
@@ -22,18 +22,15 @@ class TestWithDefault:
     def run_sanitizer_on(self, type, **kwargs):
 
         place = PlaceInfo({type: {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                          'country_code': 'de', 'rank_address': 30})
 
         sanitizer_args = {'step': 'delete-tags'}
 
         name, address = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
-
-        return {
-                'name': sorted([(p.name, p.kind, p.suffix or '') for p in name]),
-                'address': sorted([(p.name, p.kind, p.suffix or '') for p in address])
-            }
+                                       self.config).process_names(place)
 
+        return {'name': sorted([(p.name, p.kind, p.suffix or '') for p in name]),
+                'address': sorted([(p.name, p.kind, p.suffix or '') for p in address])}
 
     def test_on_name(self):
         res = self.run_sanitizer_on('name', name='foo', ref='bar', ref_abc='baz')
@@ -44,7 +41,7 @@ class TestWithDefault:
         res = self.run_sanitizer_on('address', name='foo', ref='bar', ref_abc='baz')
 
         assert res.get('address') == [('bar', 'ref', ''), ('baz', 'ref', 'abc'),
-                                        ('foo', 'name', '')]
+                                      ('foo', 'name', '')]
 
 
 class TestTypeField:
@@ -56,15 +53,13 @@ class TestTypeField:
     def run_sanitizer_on(self, type, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
-        sanitizer_args = {
-                        'step': 'delete-tags',
-                        'type': type,
-                    }
+        sanitizer_args = {'step': 'delete-tags',
+                          'type': type}
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix or '') for p in name])
 
@@ -77,7 +72,8 @@ class TestTypeField:
         res = self.run_sanitizer_on('address', name='foo', ref='bar', ref_abc='baz')
 
         assert res == [('bar', 'ref', ''), ('baz', 'ref', 'abc'),
-                        ('foo', 'name', '')]
+                       ('foo', 'name', '')]
+
 
 class TestFilterKind:
 
@@ -88,15 +84,13 @@ class TestFilterKind:
     def run_sanitizer_on(self, filt, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
-        sanitizer_args = {
-                        'step': 'delete-tags',
-                        'filter-kind': filt,
-                    }
+        sanitizer_args = {'step': 'delete-tags',
+                          'filter-kind': filt}
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix or '') for p in name])
 
@@ -106,7 +100,6 @@ class TestFilterKind:
 
         assert res == [('bar', 'ref', 'abc'), ('foo', 'ref', '')]
 
-
     def test_single_pattern(self):
         res = self.run_sanitizer_on(['.*name'],
                                     name_fr='foo', ref_fr='foo', namexx_fr='bar',
@@ -114,7 +107,6 @@ class TestFilterKind:
 
         assert res == [('bar', 'namexx', 'fr'), ('foo', 'ref', 'fr')]
 
-
     def test_multiple_patterns(self):
         res = self.run_sanitizer_on(['.*name', 'ref'],
                                     name_fr='foo', ref_fr='foo', oldref_fr='foo',
@@ -132,19 +124,16 @@ class TestRankAddress:
     def run_sanitizer_on(self, rank_addr, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
-        sanitizer_args = {
-                        'step': 'delete-tags',
-                        'rank_address': rank_addr
-                    }
+        sanitizer_args = {'step': 'delete-tags',
+                          'rank_address': rank_addr}
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix or '') for p in name])
 
-
     def test_single_rank(self):
         res = self.run_sanitizer_on('30', name='foo', ref='bar')
 
@@ -185,33 +174,29 @@ class TestSuffix:
     def run_sanitizer_on(self, suffix, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
-        sanitizer_args = {
-                        'step': 'delete-tags',
-                        'suffix': suffix,
-                    }
+        sanitizer_args = {'step': 'delete-tags',
+                          'suffix': suffix}
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix or '') for p in name])
 
-
     def test_single_suffix(self):
         res = self.run_sanitizer_on('abc', name='foo', name_abc='foo',
-                                 name_pqr='bar', ref='bar', ref_abc='baz')
+                                    name_pqr='bar', ref='bar', ref_abc='baz')
 
         assert res == [('bar', 'name', 'pqr'), ('bar', 'ref', ''), ('foo', 'name', '')]
 
     def test_multiple_suffix(self):
         res = self.run_sanitizer_on(['abc.*', 'pqr'], name='foo', name_abcxx='foo',
-                                 ref_pqr='bar', name_pqrxx='baz')
+                                    ref_pqr='bar', name_pqrxx='baz')
 
         assert res == [('baz', 'name', 'pqrxx'), ('foo', 'name', '')]
 
 
-
 class TestCountryCodes:
 
     @pytest.fixture(autouse=True)
@@ -221,19 +206,16 @@ class TestCountryCodes:
     def run_sanitizer_on(self, country_code, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
-        sanitizer_args = {
-                        'step': 'delete-tags',
-                        'country_code': country_code,
-                    }
+        sanitizer_args = {'step': 'delete-tags',
+                          'country_code': country_code}
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind) for p in name])
 
-
     def test_single_country_code_pass(self):
         res = self.run_sanitizer_on('de', name='foo', ref='bar')
 
@@ -259,6 +241,7 @@ class TestCountryCodes:
 
         assert res == [('bar', 'ref'), ('foo', 'name')]
 
+
 class TestAllParameters:
 
     @pytest.fixture(autouse=True)
@@ -268,7 +251,7 @@ class TestAllParameters:
     def run_sanitizer_on(self, country_code, rank_addr, suffix, **kwargs):
 
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
-                            'country_code': 'de', 'rank_address': 30})
+                           'country_code': 'de', 'rank_address': 30})
 
         sanitizer_args = {
                         'step': 'delete-tags',
@@ -281,11 +264,10 @@ class TestAllParameters:
                     }
 
         name, _ = PlaceSanitizer([sanitizer_args],
-                                    self.config).process_names(place)
+                                 self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix or '') for p in name])
 
-
     def test_string_arguments_pass(self):
         res = self.run_sanitizer_on('de', '25-30', r'[\s\S]*',
                                     name='foo', ref='foo', name_abc='bar', ref_abc='baz')
diff --git a/test/python/tokenizer/sanitizers/test_sanitizer_config.py b/test/python/tokenizer/sanitizers/test_sanitizer_config.py
index 0497f21d..5dd2ec03 100644
--- a/test/python/tokenizer/sanitizers/test_sanitizer_config.py
+++ b/test/python/tokenizer/sanitizers/test_sanitizer_config.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for sanitizer configuration helper functions.
@@ -12,6 +12,7 @@ import pytest
 from nominatim_db.errors import UsageError
 from nominatim_db.tokenizer.sanitizers.config import SanitizerConfig
 
+
 def test_string_list_default_empty():
     assert SanitizerConfig().get_string_list('op') == []
 
@@ -53,7 +54,7 @@ def test_create_split_regex_no_params_unsplit(inp):
                                       ('ying;;yang', ['ying', 'yang']),
                                       (';a; ;c;d,', ['', 'a', '', 'c', 'd', '']),
                                       ('1,  3  ,5', ['1', '3', '5'])
-                                     ])
+                                      ])
 def test_create_split_regex_no_params_split(inp, outp):
     regex = SanitizerConfig().get_delimiter()
 
@@ -70,7 +71,7 @@ def test_create_split_regex_custom(delimiter):
 
 def test_create_split_regex_empty_delimiter():
     with pytest.raises(UsageError):
-        regex = SanitizerConfig({'delimiters': ''}).get_delimiter()
+        SanitizerConfig({'delimiters': ''}).get_delimiter()
 
 
 @pytest.mark.parametrize('inp', ('name', 'name:de', 'na\\me', '.*', ''))
@@ -96,12 +97,12 @@ def test_create_name_filter_no_param_default_fail_all(inp):
 
 def test_create_name_filter_no_param_default_invalid_string():
     with pytest.raises(ValueError):
-        filt = SanitizerConfig().get_filter('name', 'abc')
+        SanitizerConfig().get_filter('name', 'abc')
 
 
 def test_create_name_filter_no_param_default_empty_list():
     with pytest.raises(ValueError):
-        filt = SanitizerConfig().get_filter('name', [])
+        SanitizerConfig().get_filter('name', [])
 
 
 @pytest.mark.parametrize('kind', ('de', 'name:de', 'ende'))
@@ -121,7 +122,7 @@ def test_create_kind_filter_default_negetive(kind):
 @pytest.mark.parametrize('kind', ('lang', 'lang:de', 'langxx'))
 def test_create_kind_filter_custom_regex_positive(kind):
     filt = SanitizerConfig({'filter-kind': 'lang.*'}
-    ).get_filter('filter-kind', ['.*fr'])
+                           ).get_filter('filter-kind', ['.*fr'])
 
     assert filt(kind)
 
@@ -136,7 +137,7 @@ def test_create_kind_filter_custom_regex_negative(kind):
 @pytest.mark.parametrize('kind', ('name', 'fr', 'name:fr', 'frfr', '34'))
 def test_create_kind_filter_many_positive(kind):
     filt = SanitizerConfig({'filter-kind': ['.*fr', 'name', r'\d+']}
-    ).get_filter('filter-kind')
+                           ).get_filter('filter-kind')
 
     assert filt(kind)
 
@@ -144,6 +145,6 @@ def test_create_kind_filter_many_positive(kind):
 @pytest.mark.parametrize('kind', ('name:de', 'fridge', 'a34', '.*', '\\'))
 def test_create_kind_filter_many_negative(kind):
     filt = SanitizerConfig({'filter-kind': ['.*fr', 'name', r'\d+']}
-    ).get_filter('filter-kind')
+                           ).get_filter('filter-kind')
 
     assert not filt(kind)
diff --git a/test/python/tokenizer/sanitizers/test_split_name_list.py b/test/python/tokenizer/sanitizers/test_split_name_list.py
index fbfd72da..ec4869b3 100644
--- a/test/python/tokenizer/sanitizers/test_split_name_list.py
+++ b/test/python/tokenizer/sanitizers/test_split_name_list.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that splits multivalue lists.
@@ -14,20 +14,19 @@ from nominatim_db.data.place_info import PlaceInfo
 
 from nominatim_db.errors import UsageError
 
+
 class TestSplitName:
 
     @pytest.fixture(autouse=True)
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, **kwargs):
         place = PlaceInfo({'name': kwargs})
         name, _ = PlaceSanitizer([{'step': 'split-name-list'}], self.config).process_names(place)
 
         return sorted([(p.name, p.kind, p.suffix) for p in name])
 
-
     def sanitize_with_delimiter(self, delimiter, name):
         place = PlaceInfo({'name': {'name': name}})
         san = PlaceSanitizer([{'step': 'split-name-list', 'delimiters': delimiter}],
@@ -36,12 +35,10 @@ class TestSplitName:
 
         return sorted([p.name for p in name])
 
-
     def test_simple(self):
         assert self.run_sanitizer_on(name='ABC') == [('ABC', 'name', None)]
         assert self.run_sanitizer_on(name='') == [('', 'name', None)]
 
-
     def test_splits(self):
         assert self.run_sanitizer_on(name='A;B;C') == [('A', 'name', None),
                                                        ('B', 'name', None),
@@ -49,7 +46,6 @@ class TestSplitName:
         assert self.run_sanitizer_on(short_name=' House, boat ') == [('House', 'short_name', None),
                                                                      ('boat', 'short_name', None)]
 
-
     def test_empty_fields(self):
         assert self.run_sanitizer_on(name='A;;B') == [('A', 'name', None),
                                                       ('B', 'name', None)]
@@ -58,14 +54,12 @@ class TestSplitName:
         assert self.run_sanitizer_on(name=' ;B') == [('B', 'name', None)]
         assert self.run_sanitizer_on(name='B,') == [('B', 'name', None)]
 
-
     def test_custom_delimiters(self):
         assert self.sanitize_with_delimiter(':', '12:45,3') == ['12', '45,3']
         assert self.sanitize_with_delimiter('\\', 'a;\\b!#@ \\') == ['a;', 'b!#@']
         assert self.sanitize_with_delimiter('[]', 'foo[to]be') == ['be', 'foo', 'to']
         assert self.sanitize_with_delimiter(' ', 'morning  sun') == ['morning', 'sun']
 
-
     def test_empty_delimiter_set(self):
         with pytest.raises(UsageError):
             self.sanitize_with_delimiter('', 'abc')
diff --git a/test/python/tokenizer/sanitizers/test_strip_brace_terms.py b/test/python/tokenizer/sanitizers/test_strip_brace_terms.py
index 6a4cffcf..6e891f9e 100644
--- a/test/python/tokenizer/sanitizers/test_strip_brace_terms.py
+++ b/test/python/tokenizer/sanitizers/test_strip_brace_terms.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that handles braced suffixes.
@@ -12,6 +12,7 @@ import pytest
 from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 from nominatim_db.data.place_info import PlaceInfo
 
+
 class TestStripBrace:
 
     @pytest.fixture(autouse=True)
@@ -24,23 +25,19 @@ class TestStripBrace:
 
         return sorted([(p.name, p.kind, p.suffix) for p in name])
 
-
     def test_no_braces(self):
         assert self.run_sanitizer_on(name='foo', ref='23') == [('23', 'ref', None),
                                                                ('foo', 'name', None)]
 
-
     def test_simple_braces(self):
-        assert self.run_sanitizer_on(name='Halle (Saale)', ref='3')\
-          == [('3', 'ref', None), ('Halle', 'name', None), ('Halle (Saale)', 'name', None)]
-        assert self.run_sanitizer_on(name='ack ( bar')\
-          == [('ack', 'name', None), ('ack ( bar', 'name', None)]
-
+        assert self.run_sanitizer_on(name='Halle (Saale)', ref='3') \
+            == [('3', 'ref', None), ('Halle', 'name', None), ('Halle (Saale)', 'name', None)]
+        assert self.run_sanitizer_on(name='ack ( bar') \
+            == [('ack', 'name', None), ('ack ( bar', 'name', None)]
 
     def test_only_braces(self):
         assert self.run_sanitizer_on(name='(maybe)') == [('(maybe)', 'name', None)]
 
-
     def test_double_braces(self):
         assert self.run_sanitizer_on(name='a((b))') == [('a', 'name', None),
                                                         ('a((b))', 'name', None)]
diff --git a/test/python/tokenizer/sanitizers/test_tag_analyzer_by_language.py b/test/python/tokenizer/sanitizers/test_tag_analyzer_by_language.py
index 2022e410..8f1d0540 100644
--- a/test/python/tokenizer/sanitizers/test_tag_analyzer_by_language.py
+++ b/test/python/tokenizer/sanitizers/test_tag_analyzer_by_language.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the sanitizer that enables language-dependent analyzers.
@@ -13,13 +13,13 @@ from nominatim_db.data.place_info import PlaceInfo
 from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 from nominatim_db.data.country_info import setup_country_config
 
+
 class TestWithDefaults:
 
     @pytest.fixture(autouse=True)
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, country, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
                            'country_code': country})
@@ -28,19 +28,16 @@ class TestWithDefaults:
 
         return sorted([(p.name, p.kind, p.suffix, p.attr) for p in name])
 
-
     def test_no_names(self):
         assert self.run_sanitizer_on('de') == []
 
-
     def test_simple(self):
-        res = self.run_sanitizer_on('fr', name='Foo',name_de='Zoo', ref_abc='M')
+        res = self.run_sanitizer_on('fr', name='Foo', name_de='Zoo', ref_abc='M')
 
         assert res == [('Foo', 'name', None, {}),
                        ('M', 'ref', 'abc', {'analyzer': 'abc'}),
                        ('Zoo', 'name', 'de', {'analyzer': 'de'})]
 
-
     @pytest.mark.parametrize('suffix', ['DE', 'asbc'])
     def test_illegal_suffix(self, suffix):
         assert self.run_sanitizer_on('fr', **{'name_' + suffix: 'Foo'}) \
@@ -53,7 +50,6 @@ class TestFilterKind:
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, filt, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
                            'country_code': 'de'})
@@ -63,17 +59,15 @@ class TestFilterKind:
 
         return sorted([(p.name, p.kind, p.suffix, p.attr) for p in name])
 
-
     def test_single_exact_name(self):
         res = self.run_sanitizer_on(['name'], name_fr='A', ref_fr='12',
-                                              shortname_fr='C', name='D')
+                                    shortname_fr='C', name='D')
 
         assert res == [('12', 'ref',  'fr', {}),
                        ('A',  'name', 'fr', {'analyzer': 'fr'}),
                        ('C',  'shortname', 'fr', {}),
                        ('D',  'name', None, {})]
 
-
     def test_single_pattern(self):
         res = self.run_sanitizer_on(['.*name'],
                                     name_fr='A', ref_fr='12', namexx_fr='B',
@@ -85,7 +79,6 @@ class TestFilterKind:
                        ('C',  'shortname', 'fr', {'analyzer': 'fr'}),
                        ('D',  'name', None, {})]
 
-
     def test_multiple_patterns(self):
         res = self.run_sanitizer_on(['.*name', 'ref'],
                                     name_fr='A', ref_fr='12', oldref_fr='X',
@@ -106,7 +99,6 @@ class TestDefaultCountry:
         setup_country_config(def_config)
         self.config = def_config
 
-
     def run_sanitizer_append(self, mode,  country, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
                            'country_code': country})
@@ -122,7 +114,6 @@ class TestDefaultCountry:
 
         return sorted([(p.name, p.attr.get('analyzer', '')) for p in name])
 
-
     def run_sanitizer_replace(self, mode,  country, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
                            'country_code': country})
@@ -138,7 +129,6 @@ class TestDefaultCountry:
 
         return sorted([(p.name, p.attr.get('analyzer', '')) for p in name])
 
-
     def test_missing_country(self):
         place = PlaceInfo({'name': {'name': 'something'}})
         name, _ = PlaceSanitizer([{'step': 'tag-analyzer-by-language',
@@ -151,59 +141,50 @@ class TestDefaultCountry:
         assert name[0].suffix is None
         assert 'analyzer' not in name[0].attr
 
-
     def test_mono_unknown_country(self):
         expect = [('XX', '')]
 
         assert self.run_sanitizer_replace('mono', 'xx', name='XX') == expect
         assert self.run_sanitizer_append('mono', 'xx', name='XX') == expect
 
-
     def test_mono_monoling_replace(self):
         res = self.run_sanitizer_replace('mono', 'de', name='Foo')
 
         assert res == [('Foo', 'de')]
 
-
     def test_mono_monoling_append(self):
         res = self.run_sanitizer_append('mono', 'de', name='Foo')
 
         assert res == [('Foo', ''), ('Foo', 'de')]
 
-
     def test_mono_multiling(self):
         expect = [('XX', '')]
 
         assert self.run_sanitizer_replace('mono', 'ch', name='XX') == expect
         assert self.run_sanitizer_append('mono', 'ch', name='XX') == expect
 
-
     def test_all_unknown_country(self):
         expect = [('XX', '')]
 
         assert self.run_sanitizer_replace('all', 'xx', name='XX') == expect
         assert self.run_sanitizer_append('all', 'xx', name='XX') == expect
 
-
     def test_all_monoling_replace(self):
         res = self.run_sanitizer_replace('all', 'de', name='Foo')
 
         assert res == [('Foo', 'de')]
 
-
     def test_all_monoling_append(self):
         res = self.run_sanitizer_append('all', 'de', name='Foo')
 
         assert res == [('Foo', ''), ('Foo', 'de')]
 
-
     def test_all_multiling_append(self):
         res = self.run_sanitizer_append('all', 'ch', name='XX')
 
         assert res == [('XX', ''),
                        ('XX', 'de'), ('XX', 'fr'), ('XX', 'it'), ('XX', 'rm')]
 
-
     def test_all_multiling_replace(self):
         res = self.run_sanitizer_replace('all', 'ch', name='XX')
 
@@ -216,7 +197,6 @@ class TestCountryWithWhitelist:
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, mode,  country, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()},
                            'country_code': country})
@@ -233,21 +213,17 @@ class TestCountryWithWhitelist:
 
         return sorted([(p.name, p.attr.get('analyzer', '')) for p in name])
 
-
     def test_mono_monoling(self):
         assert self.run_sanitizer_on('mono', 'de', name='Foo') == [('Foo', 'de')]
         assert self.run_sanitizer_on('mono', 'pt', name='Foo') == [('Foo', '')]
 
-
     def test_mono_multiling(self):
         assert self.run_sanitizer_on('mono', 'ca', name='Foo') == [('Foo', '')]
 
-
     def test_all_monoling(self):
         assert self.run_sanitizer_on('all', 'de', name='Foo') == [('Foo', 'de')]
         assert self.run_sanitizer_on('all', 'pt', name='Foo') == [('Foo', '')]
 
-
     def test_all_multiling(self):
         assert self.run_sanitizer_on('all', 'ca', name='Foo') == [('Foo', 'fr')]
         assert self.run_sanitizer_on('all', 'ch', name='Foo') \
@@ -260,7 +236,6 @@ class TestWhiteList:
     def setup_country(self, def_config):
         self.config = def_config
 
-
     def run_sanitizer_on(self, whitelist, **kwargs):
         place = PlaceInfo({'name': {k.replace('_', ':'): v for k, v in kwargs.items()}})
         name, _ = PlaceSanitizer([{'step': 'tag-analyzer-by-language',
@@ -275,14 +250,11 @@ class TestWhiteList:
 
         return sorted([(p.name, p.attr.get('analyzer', '')) for p in name])
 
-
     def test_in_whitelist(self):
         assert self.run_sanitizer_on(['de', 'xx'], ref_xx='123') == [('123', 'xx')]
 
-
     def test_not_in_whitelist(self):
         assert self.run_sanitizer_on(['de', 'xx'], ref_yy='123') == [('123', '')]
 
-
     def test_empty_whitelist(self):
         assert self.run_sanitizer_on([], ref_yy='123') == [('123', '')]
diff --git a/test/python/tokenizer/sanitizers/test_tag_japanese.py b/test/python/tokenizer/sanitizers/test_tag_japanese.py
index 08edbb56..6db7a3c3 100644
--- a/test/python/tokenizer/sanitizers/test_tag_japanese.py
+++ b/test/python/tokenizer/sanitizers/test_tag_japanese.py
@@ -2,86 +2,86 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
-from typing import Mapping, Optional, List
 import pytest
 
 from nominatim_db.data.place_info import PlaceInfo
-from nominatim_db.data.place_name import PlaceName
 from nominatim_db.tokenizer.place_sanitizer import PlaceSanitizer
 
+
 class TestTagJapanese:
     @pytest.fixture(autouse=True)
     def setup_country(self, def_config):
         self.config = def_config
 
-    def run_sanitizer_on(self,type, **kwargs):
+    def run_sanitizer_on(self, type, **kwargs):
         place = PlaceInfo({
             'address': kwargs,
             'country_code': 'jp'
         })
         sanitizer_args = {'step': 'tag-japanese'}
         _, address = PlaceSanitizer([sanitizer_args], self.config).process_names(place)
-        tmp_list = [(p.name,p.kind) for p in address]
+        tmp_list = [(p.name, p.kind) for p in address]
         return sorted(tmp_list)
 
     def test_on_address(self):
         res = self.run_sanitizer_on('address', name='foo', ref='bar', ref_abc='baz')
-        assert res == [('bar','ref'),('baz','ref_abc'),('foo','name')]
+        assert res == [('bar', 'ref'), ('baz', 'ref_abc'), ('foo', 'name')]
 
     def test_housenumber(self):
         res = self.run_sanitizer_on('address', housenumber='2')
-        assert res == [('2','housenumber')]
+        assert res == [('2', 'housenumber')]
 
     def test_blocknumber(self):
         res = self.run_sanitizer_on('address', block_number='6')
-        assert res == [('6','housenumber')]
+        assert res == [('6', 'housenumber')]
 
     def test_neighbourhood(self):
         res = self.run_sanitizer_on('address', neighbourhood='8')
-        assert res == [('8','place')]
+        assert res == [('8', 'place')]
 
     def test_quarter(self):
         res = self.run_sanitizer_on('address', quarter='kase')
-        assert res==[('kase','place')]
+        assert res == [('kase', 'place')]
 
     def test_housenumber_blocknumber(self):
         res = self.run_sanitizer_on('address', housenumber='2', block_number='6')
-        assert res == [('6-2','housenumber')]
+        assert res == [('6-2', 'housenumber')]
 
     def test_quarter_neighbourhood(self):
         res = self.run_sanitizer_on('address', quarter='kase', neighbourhood='8')
-        assert res == [('kase8','place')]
+        assert res == [('kase8', 'place')]
 
     def test_blocknumber_housenumber_quarter(self):
         res = self.run_sanitizer_on('address', block_number='6', housenumber='2', quarter='kase')
-        assert res == [('6-2','housenumber'),('kase','place')]
+        assert res == [('6-2', 'housenumber'), ('kase', 'place')]
 
     def test_blocknumber_housenumber_quarter_neighbourhood(self):
         res = self.run_sanitizer_on('address', block_number='6', housenumber='2', neighbourhood='8')
-        assert res == [('6-2','housenumber'),('8','place')]
+        assert res == [('6-2', 'housenumber'), ('8', 'place')]
 
     def test_blocknumber_quarter_neighbourhood(self):
-        res = self.run_sanitizer_on('address',block_number='6', quarter='kase', neighbourhood='8')
-        assert res == [('6','housenumber'),('kase8','place')]
+        res = self.run_sanitizer_on('address', block_number='6', quarter='kase', neighbourhood='8')
+        assert res == [('6', 'housenumber'), ('kase8', 'place')]
 
     def test_blocknumber_quarter(self):
-        res = self.run_sanitizer_on('address',block_number='6', quarter='kase')
-        assert res == [('6','housenumber'),('kase','place')]
+        res = self.run_sanitizer_on('address', block_number='6', quarter='kase')
+        assert res == [('6', 'housenumber'), ('kase', 'place')]
 
     def test_blocknumber_neighbourhood(self):
-        res = self.run_sanitizer_on('address',block_number='6', neighbourhood='8')
-        assert res == [('6','housenumber'),('8','place')]
+        res = self.run_sanitizer_on('address', block_number='6', neighbourhood='8')
+        assert res == [('6', 'housenumber'), ('8', 'place')]
 
     def test_housenumber_quarter_neighbourhood(self):
-        res = self.run_sanitizer_on('address',housenumber='2', quarter='kase', neighbourhood='8')
-        assert res == [('2','housenumber'),('kase8','place')]
+        res = self.run_sanitizer_on('address', housenumber='2', quarter='kase', neighbourhood='8')
+        assert res == [('2', 'housenumber'), ('kase8', 'place')]
 
     def test_housenumber_quarter(self):
-        res = self.run_sanitizer_on('address',housenumber='2', quarter='kase')
-        assert res == [('2','housenumber'),('kase','place')]
+        res = self.run_sanitizer_on('address', housenumber='2', quarter='kase')
+        assert res == [('2', 'housenumber'), ('kase', 'place')]
 
     def test_housenumber_blocknumber_neighbourhood_quarter(self):
-        res = self.run_sanitizer_on('address', block_number='6', housenumber='2', quarter='kase', neighbourhood='8')
-        assert res == [('6-2','housenumber'),('kase8','place')]
+        res = self.run_sanitizer_on('address', block_number='6', housenumber='2',
+                                    quarter='kase', neighbourhood='8')
+        assert res == [('6-2', 'housenumber'), ('kase8', 'place')]
diff --git a/test/python/tokenizer/test_factory.py b/test/python/tokenizer/test_factory.py
index 632dea88..106cdaaf 100644
--- a/test/python/tokenizer/test_factory.py
+++ b/test/python/tokenizer/test_factory.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for creating new tokenizers.
@@ -27,33 +27,14 @@ class TestFactory:
     def init_env(self, project_env, property_table, tokenizer_mock):
         self.config = project_env
 
-
     def test_setup_dummy_tokenizer(self, temp_db_conn):
         tokenizer = factory.create_tokenizer(self.config)
 
         assert isinstance(tokenizer, DummyTokenizer)
         assert tokenizer.init_state == "new"
-        assert (self.config.project_dir / 'tokenizer').is_dir()
 
         assert properties.get_property(temp_db_conn, 'tokenizer') == 'dummy'
 
-
-    def test_setup_tokenizer_dir_exists(self):
-        (self.config.project_dir / 'tokenizer').mkdir()
-
-        tokenizer = factory.create_tokenizer(self.config)
-
-        assert isinstance(tokenizer, DummyTokenizer)
-        assert tokenizer.init_state == "new"
-
-
-    def test_setup_tokenizer_dir_failure(self):
-        (self.config.project_dir / 'tokenizer').write_text("foo")
-
-        with pytest.raises(UsageError):
-            factory.create_tokenizer(self.config)
-
-
     def test_load_tokenizer(self):
         factory.create_tokenizer(self.config)
 
@@ -62,15 +43,12 @@ class TestFactory:
         assert isinstance(tokenizer, DummyTokenizer)
         assert tokenizer.init_state == "loaded"
 
-
     def test_load_repopulate_tokenizer_dir(self):
         factory.create_tokenizer(self.config)
 
         self.config.project_dir = self.config.project_dir
 
         factory.get_tokenizer_for_db(self.config)
-        assert (self.config.project_dir / 'tokenizer').exists()
-
 
     def test_load_missing_property(self, temp_db_cursor):
         factory.create_tokenizer(self.config)
diff --git a/test/python/tokenizer/test_icu.py b/test/python/tokenizer/test_icu.py
index a2bf6766..6d2e9ce7 100644
--- a/test/python/tokenizer/test_icu.py
+++ b/test/python/tokenizer/test_icu.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for ICU tokenizer.
@@ -20,6 +20,7 @@ from nominatim_db.data.place_info import PlaceInfo
 
 from mock_icu_word_table import MockIcuWordTable
 
+
 @pytest.fixture
 def word_table(temp_db_conn):
     return MockIcuWordTable(temp_db_conn)
@@ -38,12 +39,9 @@ def test_config(project_env, tmp_path):
 
 
 @pytest.fixture
-def tokenizer_factory(dsn, tmp_path, property_table,
-                      sql_preprocessor, place_table, word_table):
-    (tmp_path / 'tokenizer').mkdir()
-
+def tokenizer_factory(dsn, property_table, sql_preprocessor, place_table, word_table):
     def _maker():
-        return icu_tokenizer.create(dsn, tmp_path / 'tokenizer')
+        return icu_tokenizer.create(dsn)
 
     return _maker
 
@@ -89,6 +87,7 @@ def analyzer(tokenizer_factory, test_config, monkeypatch,
 
     return _mk_analyser
 
+
 @pytest.fixture
 def sql_functions(temp_db_conn, def_config, src_dir):
     orig_sql = def_config.lib_dir.sql
@@ -152,19 +151,19 @@ LANGUAGE plpgsql;
                               """)
 
 
-
 def test_init_new(tokenizer_factory, test_config, db_prop):
     tok = tokenizer_factory()
     tok.init_new_db(test_config)
 
-    assert db_prop(nominatim_db.tokenizer.icu_rule_loader.DBCFG_IMPORT_NORM_RULES) \
-            .startswith(':: lower ();')
+    prop = db_prop(nominatim_db.tokenizer.icu_rule_loader.DBCFG_IMPORT_NORM_RULES)
+
+    assert prop.startswith(':: lower ();')
 
 
 def test_init_word_table(tokenizer_factory, test_config, place_row, temp_db_cursor):
-    place_row(names={'name' : 'Test Area', 'ref' : '52'})
-    place_row(names={'name' : 'No Area'})
-    place_row(names={'name' : 'Holzstrasse'})
+    place_row(names={'name': 'Test Area', 'ref': '52'})
+    place_row(names={'name': 'No Area'})
+    place_row(names={'name': 'Holzstrasse'})
 
     tok = tokenizer_factory()
     tok.init_new_db(test_config)
@@ -228,19 +227,20 @@ def test_update_statistics(word_table, table_factory, temp_db_cursor,
                            tokenizer_factory, test_config):
     word_table.add_full_word(1000, 'hello')
     word_table.add_full_word(1001, 'bye')
+    word_table.add_full_word(1002, 'town')
     table_factory('search_name',
                   'place_id BIGINT, name_vector INT[], nameaddress_vector INT[]',
-                  [(12, [1000], [1001])])
+                  [(12, [1000], [1001]), (13, [1001], [1002]), (14, [1000, 1001], [1002])])
     tok = tokenizer_factory()
 
     tok.update_statistics(test_config)
 
-    assert temp_db_cursor.scalar("""SELECT count(*) FROM word
-                                    WHERE type = 'W' and word_id = 1000 and
-                                          (info->>'count')::int > 0""") == 1
-    assert temp_db_cursor.scalar("""SELECT count(*) FROM word
-                                    WHERE type = 'W' and word_id = 1001 and
-                                          (info->>'addr_count')::int > 0""") == 1
+    assert temp_db_cursor.row_set("""SELECT word_id,
+                                            (info->>'count')::int,
+                                            (info->>'addr_count')::int
+                                     FROM word
+                                     WHERE type = 'W'""") == \
+        {(1000, 2, None), (1001, 2, None), (1002, None, 2)}
 
 
 def test_normalize_postcode(analyzer):
@@ -259,61 +259,28 @@ class TestPostcodes:
             self.analyzer = anl
             yield anl
 
-
     def process_postcode(self, cc, postcode):
         return self.analyzer.process_place(PlaceInfo({'country_code': cc,
                                                       'address': {'postcode': postcode}}))
 
-
-    def test_update_postcodes_from_db_empty(self, table_factory, word_table):
-        table_factory('location_postcode', 'country_code TEXT, postcode TEXT',
-                      content=(('de', '12345'), ('se', '132 34'),
-                               ('bm', 'AB23'), ('fr', '12345')))
-
-        self.analyzer.update_postcodes_from_db()
-
-        assert word_table.count() == 5
-        assert word_table.get_postcodes() == {'12345', '132 34@132 34', 'AB 23@AB 23'}
-
-
-    def test_update_postcodes_from_db_ambigious(self, table_factory, word_table):
-        table_factory('location_postcode', 'country_code TEXT, postcode TEXT',
-                      content=(('in', '123456'), ('sg', '123456')))
-
-        self.analyzer.update_postcodes_from_db()
-
-        assert word_table.count() == 3
-        assert word_table.get_postcodes() == {'123456', '123456@123 456'}
-
-
-    def test_update_postcodes_from_db_add_and_remove(self, table_factory, word_table):
-        table_factory('location_postcode', 'country_code TEXT, postcode TEXT',
-                      content=(('ch', '1234'), ('bm', 'BC 45'), ('bm', 'XX45')))
+    def test_update_postcodes_deleted(self, word_table):
         word_table.add_postcode(' 1234', '1234')
         word_table.add_postcode(' 5678', '5678')
 
         self.analyzer.update_postcodes_from_db()
 
-        assert word_table.count() == 5
-        assert word_table.get_postcodes() == {'1234', 'BC 45@BC 45', 'XX 45@XX 45'}
-
+        assert word_table.count() == 0
 
     def test_process_place_postcode_simple(self, word_table):
         info = self.process_postcode('de', '12345')
 
         assert info['postcode'] == '12345'
 
-        assert word_table.get_postcodes() == {'12345', }
-
-
     def test_process_place_postcode_with_space(self, word_table):
         info = self.process_postcode('in', '123 567')
 
         assert info['postcode'] == '123567'
 
-        assert word_table.get_postcodes() == {'123567@123 567', }
-
-
 
 def test_update_special_phrase_empty_table(analyzer, word_table):
     with analyzer() as anl:
@@ -324,9 +291,9 @@ def test_update_special_phrase_empty_table(analyzer, word_table):
         ], True)
 
     assert word_table.get_special() \
-               == {('KÖNIG BEI', 'König bei', 'amenity', 'royal', 'near'),
-                   ('KÖNIGE', 'Könige', 'amenity', 'royal', None),
-                   ('STREET', 'street', 'highway', 'primary', 'in')}
+        == {('KÖNIG BEI', 'König bei', 'amenity', 'royal', 'near'),
+            ('KÖNIGE', 'Könige', 'amenity', 'royal', None),
+            ('STREET', 'street', 'highway', 'primary', 'in')}
 
 
 def test_update_special_phrase_delete_all(analyzer, word_table):
@@ -367,9 +334,9 @@ def test_update_special_phrase_modify(analyzer, word_table):
         ], True)
 
     assert word_table.get_special() \
-               == {('PRISON', 'prison', 'amenity', 'prison', 'in'),
-                   ('BAR', 'bar', 'highway', 'road', None),
-                   ('GARDEN', 'garden', 'leisure', 'garden', 'near')}
+        == {('PRISON', 'prison', 'amenity', 'prison', 'in'),
+            ('BAR', 'bar', 'highway', 'road', None),
+            ('GARDEN', 'garden', 'leisure', 'garden', 'near')}
 
 
 def test_add_country_names_new(analyzer, word_table):
@@ -398,7 +365,6 @@ class TestPlaceNames:
             self.analyzer = anl
             yield anl
 
-
     def expect_name_terms(self, info, *expected_terms):
         tokens = self.analyzer.get_word_token_info(expected_terms)
         for token in tokens:
@@ -406,34 +372,29 @@ class TestPlaceNames:
 
         assert eval(info['names']) == set((t[2] for t in tokens))
 
-
     def process_named_place(self, names):
         return self.analyzer.process_place(PlaceInfo({'name': names}))
 
-
     def test_simple_names(self):
         info = self.process_named_place({'name': 'Soft bAr', 'ref': '34'})
 
         self.expect_name_terms(info, '#Soft bAr', '#34', 'Soft', 'bAr', '34')
 
-
-    @pytest.mark.parametrize('sep', [',' , ';'])
+    @pytest.mark.parametrize('sep', [',', ';'])
     def test_names_with_separator(self, sep):
         info = self.process_named_place({'name': sep.join(('New York', 'Big Apple'))})
 
         self.expect_name_terms(info, '#New York', '#Big Apple',
                                      'new', 'york', 'big', 'apple')
 
-
     def test_full_names_with_bracket(self):
         info = self.process_named_place({'name': 'Houseboat (left)'})
 
         self.expect_name_terms(info, '#Houseboat (left)', '#Houseboat',
                                      'houseboat', 'left')
 
-
     def test_country_name(self, word_table):
-        place = PlaceInfo({'name' : {'name': 'Norge'},
+        place = PlaceInfo({'name': {'name': 'Norge'},
                            'country_code': 'no',
                            'rank_address': 4,
                            'class': 'boundary',
@@ -455,18 +416,15 @@ class TestPlaceAddress:
             self.analyzer = anl
             yield anl
 
-
     @pytest.fixture
     def getorcreate_hnr_id(self, temp_db_cursor):
         temp_db_cursor.execute("""CREATE OR REPLACE FUNCTION getorcreate_hnr_id(lookup_term TEXT)
                                   RETURNS INTEGER AS $$
                                     SELECT -nextval('seq_word')::INTEGER; $$ LANGUAGE SQL""")
 
-
     def process_address(self, **kwargs):
         return self.analyzer.process_place(PlaceInfo({'address': kwargs}))
 
-
     def name_token_set(self, *expected_terms):
         tokens = self.analyzer.get_word_token_info(expected_terms)
         for token in tokens:
@@ -474,13 +432,11 @@ class TestPlaceAddress:
 
         return set((t[2] for t in tokens))
 
-
     @pytest.mark.parametrize('pcode', ['12345', 'AB 123', '34-345'])
     def test_process_place_postcode(self, word_table, pcode):
-        self.process_address(postcode=pcode)
-
-        assert word_table.get_postcodes() == {pcode, }
+        info = self.process_address(postcode=pcode)
 
+        assert info['postcode'] == pcode
 
     @pytest.mark.parametrize('hnr', ['123a', '1', '101'])
     def test_process_place_housenumbers_simple(self, hnr, getorcreate_hnr_id):
@@ -489,7 +445,6 @@ class TestPlaceAddress:
         assert info['hnr'] == hnr.upper()
         assert info['hnr_tokens'] == "{-1}"
 
-
     def test_process_place_housenumbers_duplicates(self, getorcreate_hnr_id):
         info = self.process_address(housenumber='134',
                                     conscriptionnumber='134',
@@ -498,7 +453,6 @@ class TestPlaceAddress:
         assert set(info['hnr'].split(';')) == set(('134', '99A'))
         assert info['hnr_tokens'] == "{-1,-2}"
 
-
     def test_process_place_housenumbers_cached(self, getorcreate_hnr_id):
         info = self.process_address(housenumber="45")
         assert info['hnr_tokens'] == "{-1}"
@@ -512,37 +466,32 @@ class TestPlaceAddress:
         info = self.process_address(housenumber="41")
         assert eval(info['hnr_tokens']) == {-3}
 
-
     def test_process_place_street(self):
-        self.analyzer.process_place(PlaceInfo({'name': {'name' : 'Grand Road'}}))
+        self.analyzer.process_place(PlaceInfo({'name': {'name': 'Grand Road'}}))
         info = self.process_address(street='Grand Road')
 
         assert eval(info['street']) == self.name_token_set('#Grand Road')
 
-
     def test_process_place_nonexisting_street(self):
         info = self.process_address(street='Grand Road')
 
         assert info['street'] == '{}'
 
-
     def test_process_place_multiple_street_tags(self):
-        self.analyzer.process_place(PlaceInfo({'name': {'name' : 'Grand Road',
+        self.analyzer.process_place(PlaceInfo({'name': {'name': 'Grand Road',
                                                         'ref': '05989'}}))
         info = self.process_address(**{'street': 'Grand Road',
-                                      'street:sym_ul': '05989'})
+                                       'street:sym_ul': '05989'})
 
         assert eval(info['street']) == self.name_token_set('#Grand Road', '#05989')
 
-
     def test_process_place_street_empty(self):
         info = self.process_address(street='ðµ')
 
         assert info['street'] == '{}'
 
-
     def test_process_place_street_from_cache(self):
-        self.analyzer.process_place(PlaceInfo({'name': {'name' : 'Grand Road'}}))
+        self.analyzer.process_place(PlaceInfo({'name': {'name': 'Grand Road'}}))
         self.process_address(street='Grand Road')
 
         # request address again
@@ -550,25 +499,21 @@ class TestPlaceAddress:
 
         assert eval(info['street']) == self.name_token_set('#Grand Road')
 
-
     def test_process_place_place(self):
         info = self.process_address(place='Honu Lulu')
 
         assert eval(info['place']) == self.name_token_set('HONU', 'LULU', '#HONU LULU')
 
-
     def test_process_place_place_extra(self):
         info = self.process_address(**{'place:en': 'Honu Lulu'})
 
         assert 'place' not in info
 
-
     def test_process_place_place_empty(self):
         info = self.process_address(place='ðµ')
 
         assert 'place' not in info
 
-
     def test_process_place_address_terms(self):
         info = self.process_address(country='de', city='Zwickau', state='Sachsen',
                                     suburb='Zwickau', street='Hauptstr',
@@ -577,19 +522,17 @@ class TestPlaceAddress:
         city = self.name_token_set('ZWICKAU', '#ZWICKAU')
         state = self.name_token_set('SACHSEN', '#SACHSEN')
 
-        result = {k: eval(v) for k,v in info['addr'].items()}
+        result = {k: eval(v) for k, v in info['addr'].items()}
 
         assert result == {'city': city, 'suburb': city, 'state': state}
 
-
     def test_process_place_multiple_address_terms(self):
         info = self.process_address(**{'city': 'Bruxelles', 'city:de': 'BrÃ¼ssel'})
 
-        result = {k: eval(v) for k,v in info['addr'].items()}
+        result = {k: eval(v) for k, v in info['addr'].items()}
 
         assert result == {'city': self.name_token_set('Bruxelles', '#Bruxelles')}
 
-
     def test_process_place_address_terms_empty(self):
         info = self.process_address(country='de', city=' ', street='Hauptstr',
                                     full='right behind the church')
@@ -603,22 +546,21 @@ class TestPlaceHousenumberWithAnalyser:
     def setup(self, analyzer, sql_functions):
         hnr = {'step': 'clean-housenumbers',
                'filter-kind': ['housenumber', 'conscriptionnumber', 'streetnumber']}
-        with analyzer(trans=(":: upper()", "'ðµ' > ' '"), sanitizers=[hnr], with_housenumber=True) as anl:
+        with analyzer(trans=(":: upper()", "'ðµ' > ' '"), sanitizers=[hnr],
+                      with_housenumber=True) as anl:
             self.analyzer = anl
             yield anl
 
-
     @pytest.fixture
     def getorcreate_hnr_id(self, temp_db_cursor):
-        temp_db_cursor.execute("""CREATE OR REPLACE FUNCTION create_analyzed_hnr_id(norm_term TEXT, lookup_terms TEXT[])
-                                  RETURNS INTEGER AS $$
-                                    SELECT -nextval('seq_word')::INTEGER; $$ LANGUAGE SQL""")
-
+        temp_db_cursor.execute("""
+            CREATE OR REPLACE FUNCTION create_analyzed_hnr_id(norm_term TEXT, lookup_terms TEXT[])
+            RETURNS INTEGER AS $$
+                SELECT -nextval('seq_word')::INTEGER; $$ LANGUAGE SQL""")
 
     def process_address(self, **kwargs):
         return self.analyzer.process_place(PlaceInfo({'address': kwargs}))
 
-
     def name_token_set(self, *expected_terms):
         tokens = self.analyzer.get_word_token_info(expected_terms)
         for token in tokens:
@@ -626,7 +568,6 @@ class TestPlaceHousenumberWithAnalyser:
 
         return set((t[2] for t in tokens))
 
-
     @pytest.mark.parametrize('hnr', ['123 a', '1', '101'])
     def test_process_place_housenumbers_simple(self, hnr, getorcreate_hnr_id):
         info = self.process_address(housenumber=hnr)
@@ -634,7 +575,6 @@ class TestPlaceHousenumberWithAnalyser:
         assert info['hnr'] == hnr.upper()
         assert info['hnr_tokens'] == "{-1}"
 
-
     def test_process_place_housenumbers_duplicates(self, getorcreate_hnr_id):
         info = self.process_address(housenumber='134',
                                     conscriptionnumber='134',
@@ -643,7 +583,6 @@ class TestPlaceHousenumberWithAnalyser:
         assert set(info['hnr'].split(';')) == set(('134', '99 A'))
         assert info['hnr_tokens'] == "{-1,-2}"
 
-
     def test_process_place_housenumbers_cached(self, getorcreate_hnr_id):
         info = self.process_address(housenumber="45")
         assert info['hnr_tokens'] == "{-1}"
@@ -665,7 +604,6 @@ class TestUpdateWordTokens:
         table_factory('search_name', 'place_id BIGINT, name_vector INT[]')
         self.tok = tokenizer_factory()
 
-
     @pytest.fixture
     def search_entry(self, temp_db_cursor):
         place_id = itertools.count(1000)
@@ -676,7 +614,6 @@ class TestUpdateWordTokens:
 
         return _insert
 
-
     @pytest.fixture(params=['simple', 'analyzed'])
     def add_housenumber(self, request, word_table):
         if request.param == 'simple':
@@ -688,7 +625,6 @@ class TestUpdateWordTokens:
 
         return _make
 
-
     @pytest.mark.parametrize('hnr', ('1a', '1234567', '34 5'))
     def test_remove_unused_housenumbers(self, add_housenumber, word_table, hnr):
         word_table.add_housenumber(1000, hnr)
@@ -697,7 +633,6 @@ class TestUpdateWordTokens:
         self.tok.update_word_tokens()
         assert word_table.count_housenumbers() == 0
 
-
     def test_keep_unused_numeral_housenumbers(self, add_housenumber, word_table):
         add_housenumber(1000, '5432')
 
@@ -705,8 +640,8 @@ class TestUpdateWordTokens:
         self.tok.update_word_tokens()
         assert word_table.count_housenumbers() == 1
 
-
-    def test_keep_housenumbers_from_search_name_table(self, add_housenumber, word_table, search_entry):
+    def test_keep_housenumbers_from_search_name_table(self, add_housenumber,
+                                                      word_table, search_entry):
         add_housenumber(9999, '5432a')
         add_housenumber(9991, '9 a')
         search_entry(123, 9999, 34)
@@ -715,8 +650,8 @@ class TestUpdateWordTokens:
         self.tok.update_word_tokens()
         assert word_table.count_housenumbers() == 1
 
-
-    def test_keep_housenumbers_from_placex_table(self, add_housenumber, word_table, placex_table):
+    def test_keep_housenumbers_from_placex_table(self, add_housenumber, word_table,
+                                                 placex_table):
         add_housenumber(9999, '5432a')
         add_housenumber(9990, '34z')
         placex_table.add(housenumber='34z')
@@ -726,8 +661,8 @@ class TestUpdateWordTokens:
         self.tok.update_word_tokens()
         assert word_table.count_housenumbers() == 1
 
-
-    def test_keep_housenumbers_from_placex_table_hnr_list(self, add_housenumber, word_table, placex_table):
+    def test_keep_housenumbers_from_placex_table_hnr_list(self, add_housenumber,
+                                                          word_table, placex_table):
         add_housenumber(9991, '9 b')
         add_housenumber(9990, '34z')
         placex_table.add(housenumber='9 a;9 b;9 c')
diff --git a/test/python/tokenizer/test_icu_rule_loader.py b/test/python/tokenizer/test_icu_rule_loader.py
index a3fae758..f26b84c2 100644
--- a/test/python/tokenizer/test_icu_rule_loader.py
+++ b/test/python/tokenizer/test_icu_rule_loader.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for converting a config file to ICU rules.
@@ -19,17 +19,16 @@ from icu import Transliterator
 
 CONFIG_SECTIONS = ('normalization', 'transliteration', 'token-analysis')
 
+
 class TestIcuRuleLoader:
 
     @pytest.fixture(autouse=True)
     def init_env(self, project_env):
         self.project_env = project_env
 
-
     def write_config(self, content):
         (self.project_env.project_dir / 'icu_tokenizer.yaml').write_text(dedent(content))
 
-
     def config_rules(self, *variants):
         content = dedent("""\
         normalization:
@@ -49,14 +48,12 @@ class TestIcuRuleLoader:
         content += '\n'.join(("             - " + s for s in variants)) + '\n'
         self.write_config(content)
 
-
     def get_replacements(self, *variants):
         self.config_rules(*variants)
         loader = ICURuleLoader(self.project_env)
         rules = loader.analysis[None].config['replacements']
 
-        return sorted((k, sorted(v)) for k,v in rules)
-
+        return sorted((k, sorted(v)) for k, v in rules)
 
     def test_empty_rule_set(self):
         self.write_config("""\
@@ -72,16 +69,14 @@ class TestIcuRuleLoader:
         assert rules.get_normalization_rules() == ''
         assert rules.get_transliteration_rules() == ''
 
-
     @pytest.mark.parametrize("section", CONFIG_SECTIONS)
     def test_missing_section(self, section):
-        rule_cfg = { s: [] for s in CONFIG_SECTIONS if s != section}
+        rule_cfg = {s: [] for s in CONFIG_SECTIONS if s != section}
         self.write_config(yaml.dump(rule_cfg))
 
         with pytest.raises(UsageError):
             ICURuleLoader(self.project_env)
 
-
     def test_get_search_rules(self):
         self.config_rules()
         loader = ICURuleLoader(self.project_env)
@@ -97,7 +92,6 @@ class TestIcuRuleLoader:
         assert trans.transliterate(" ÎÎ¸Î®Î½Î± ") == " athÄna "
         assert trans.transliterate(" Ð¿ÑÐ¾ÑÐ¿ÐµÐºÑ ") == " prospekt "
 
-
     def test_get_normalization_rules(self):
         self.config_rules()
         loader = ICURuleLoader(self.project_env)
@@ -106,7 +100,6 @@ class TestIcuRuleLoader:
 
         assert trans.transliterate(" Ð¿ÑÐ¾ÑÐ¿ÐµÐºÑ-Prospekt ") == " Ð¿ÑÐ¾ÑÐ¿ÐµÐºÑ prospekt "
 
-
     def test_get_transliteration_rules(self):
         self.config_rules()
         loader = ICURuleLoader(self.project_env)
@@ -115,7 +108,6 @@ class TestIcuRuleLoader:
 
         assert trans.transliterate(" Ð¿ÑÐ¾ÑÐ¿ÐµÐºÑ-Prospekt ") == " prospekt Prospekt "
 
-
     def test_transliteration_rules_from_file(self):
         self.write_config("""\
             normalization:
@@ -135,7 +127,6 @@ class TestIcuRuleLoader:
 
         assert trans.transliterate(" axxt ") == " byt "
 
-
     def test_search_rules(self):
         self.config_rules('~street => s,st', 'master => mstr')
         proc = ICURuleLoader(self.project_env).make_token_analysis()
@@ -144,7 +135,6 @@ class TestIcuRuleLoader:
         assert proc.search.transliterate('Earnes St').strip() == 'earnes st'
         assert proc.search.transliterate('Nostreet').strip() == 'nostreet'
 
-
     @pytest.mark.parametrize("variant", ['foo > bar', 'foo -> bar -> bar',
                                          '~foo~ -> bar', 'fo~ o -> bar'])
     def test_invalid_variant_description(self, variant):
@@ -157,25 +147,21 @@ class TestIcuRuleLoader:
 
         assert repl == [(' foo ', [' bar', ' foo'])]
 
-
     def test_replace_full(self):
         repl = self.get_replacements("foo => bar")
 
         assert repl == [(' foo ', [' bar'])]
 
-
     def test_add_suffix_no_decompose(self):
         repl = self.get_replacements("~berg |-> bg")
 
         assert repl == [(' berg ', [' berg', ' bg']),
                         ('berg ', ['berg', 'bg'])]
 
-
     def test_replace_suffix_no_decompose(self):
         repl = self.get_replacements("~berg |=> bg")
 
-        assert repl == [(' berg ', [' bg']),('berg ', ['bg'])]
-
+        assert repl == [(' berg ', [' bg']), ('berg ', ['bg'])]
 
     def test_add_suffix_decompose(self):
         repl = self.get_replacements("~berg -> bg")
@@ -183,26 +169,22 @@ class TestIcuRuleLoader:
         assert repl == [(' berg ', [' berg', ' bg', 'berg', 'bg']),
                         ('berg ', [' berg', ' bg', 'berg', 'bg'])]
 
-
     def test_replace_suffix_decompose(self):
         repl = self.get_replacements("~berg => bg")
 
         assert repl == [(' berg ', [' bg', 'bg']),
                         ('berg ', [' bg', 'bg'])]
 
-
     def test_add_prefix_no_compose(self):
         repl = self.get_replacements("hinter~ |-> hnt")
 
         assert repl == [(' hinter', [' hinter', ' hnt']),
                         (' hinter ', [' hinter', ' hnt'])]
 
-
     def test_replace_prefix_no_compose(self):
         repl = self.get_replacements("hinter~ |=> hnt")
 
-        assert repl ==  [(' hinter', [' hnt']), (' hinter ', [' hnt'])]
-
+        assert repl == [(' hinter', [' hnt']), (' hinter ', [' hnt'])]
 
     def test_add_prefix_compose(self):
         repl = self.get_replacements("hinter~-> h")
@@ -210,45 +192,38 @@ class TestIcuRuleLoader:
         assert repl == [(' hinter', [' h', ' h ', ' hinter', ' hinter ']),
                         (' hinter ', [' h', ' h', ' hinter', ' hinter'])]
 
-
     def test_replace_prefix_compose(self):
         repl = self.get_replacements("hinter~=> h")
 
         assert repl == [(' hinter', [' h', ' h ']),
                         (' hinter ', [' h', ' h'])]
 
-
     def test_add_beginning_only(self):
         repl = self.get_replacements("^Premier -> Pr")
 
         assert repl == [('^ premier ', ['^ pr', '^ premier'])]
 
-
     def test_replace_beginning_only(self):
         repl = self.get_replacements("^Premier => Pr")
 
         assert repl == [('^ premier ', ['^ pr'])]
 
-
     def test_add_final_only(self):
         repl = self.get_replacements("road$ -> rd")
 
         assert repl == [(' road ^', [' rd ^', ' road ^'])]
 
-
     def test_replace_final_only(self):
         repl = self.get_replacements("road$ => rd")
 
         assert repl == [(' road ^', [' rd ^'])]
 
-
     def test_decompose_only(self):
         repl = self.get_replacements("~foo -> foo")
 
         assert repl == [(' foo ', [' foo', 'foo']),
                         ('foo ', [' foo', 'foo'])]
 
-
     def test_add_suffix_decompose_end_only(self):
         repl = self.get_replacements("~berg |-> bg", "~berg$ -> bg")
 
@@ -257,7 +232,6 @@ class TestIcuRuleLoader:
                         ('berg ', ['berg', 'bg']),
                         ('berg ^', [' berg ^', ' bg ^', 'berg ^', 'bg ^'])]
 
-
     def test_replace_suffix_decompose_end_only(self):
         repl = self.get_replacements("~berg |=> bg", "~berg$ => bg")
 
@@ -266,7 +240,6 @@ class TestIcuRuleLoader:
                         ('berg ', ['bg']),
                         ('berg ^', [' bg ^', 'bg ^'])]
 
-
     def test_add_multiple_suffix(self):
         repl = self.get_replacements("~berg,~burg -> bg")
 
diff --git a/test/python/tokenizer/test_place_sanitizer.py b/test/python/tokenizer/test_place_sanitizer.py
index 25844459..fcf02bd3 100644
--- a/test/python/tokenizer/test_place_sanitizer.py
+++ b/test/python/tokenizer/test_place_sanitizer.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for execution of the sanitztion step.
@@ -50,13 +50,13 @@ def test_placeinfo_has_attr():
 def test_sanitizer_default(def_config):
     san = sanitizer.PlaceSanitizer([{'step': 'split-name-list'}], def_config)
 
-    name, address =  san.process_names(PlaceInfo({'name': {'name:de:de': '1;2;3'},
-                                                  'address': {'street': 'Bald'}}))
+    name, address = san.process_names(PlaceInfo({'name': {'name:de:de': '1;2;3'},
+                                                 'address': {'street': 'Bald'}}))
 
     assert len(name) == 3
     assert all(isinstance(n, sanitizer.PlaceName) for n in name)
-    assert all(n.kind == 'name'  for n in name)
-    assert all(n.suffix == 'de:de'  for n in name)
+    assert all(n.kind == 'name' for n in name)
+    assert all(n.suffix == 'de:de' for n in name)
 
     assert len(address) == 1
     assert all(isinstance(n, sanitizer.PlaceName) for n in address)
@@ -66,7 +66,7 @@ def test_sanitizer_default(def_config):
 def test_sanitizer_empty_list(def_config, rules):
     san = sanitizer.PlaceSanitizer(rules, def_config)
 
-    name, address =  san.process_names(PlaceInfo({'name': {'name:de:de': '1;2;3'}}))
+    name, address = san.process_names(PlaceInfo({'name': {'name:de:de': '1;2;3'}}))
 
     assert len(name) == 1
     assert all(isinstance(n, sanitizer.PlaceName) for n in name)
@@ -74,4 +74,4 @@ def test_sanitizer_empty_list(def_config, rules):
 
 def test_sanitizer_missing_step_definition(def_config):
     with pytest.raises(UsageError):
-        san = sanitizer.PlaceSanitizer([{'id': 'split-name-list'}], def_config)
+        sanitizer.PlaceSanitizer([{'id': 'split-name-list'}], def_config)
diff --git a/test/python/tokenizer/token_analysis/test_analysis_postcodes.py b/test/python/tokenizer/token_analysis/test_analysis_postcodes.py
index 870c8a5d..1eb15a50 100644
--- a/test/python/tokenizer/token_analysis/test_analysis_postcodes.py
+++ b/test/python/tokenizer/token_analysis/test_analysis_postcodes.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for special postcode analysis and variant generation.
@@ -13,7 +13,6 @@ from icu import Transliterator
 
 import nominatim_db.tokenizer.token_analysis.postcodes as module
 from nominatim_db.data.place_name import PlaceName
-from nominatim_db.errors import UsageError
 
 DEFAULT_NORMALIZATION = """ :: NFD ();
                             'ð³' > ' ';
@@ -27,9 +26,10 @@ DEFAULT_TRANSLITERATION = """ ::  Latin ();
                               'ðµ' > ' ';
                           """
 
+
 @pytest.fixture
 def analyser():
-    rules = { 'analyzer': 'postcodes'}
+    rules = {'analyzer': 'postcodes'}
     config = module.configure(rules, DEFAULT_NORMALIZATION)
 
     trans = Transliterator.createFromRules("test_trans", DEFAULT_TRANSLITERATION)
diff --git a/test/python/tokenizer/token_analysis/test_generic.py b/test/python/tokenizer/token_analysis/test_generic.py
index 191f551f..48f2483b 100644
--- a/test/python/tokenizer/token_analysis/test_generic.py
+++ b/test/python/tokenizer/token_analysis/test_generic.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for import name normalisation and variant generation.
@@ -26,8 +26,9 @@ DEFAULT_TRANSLITERATION = """ ::  Latin ();
                               'ðµ' > ' ';
                           """
 
+
 def make_analyser(*variants, variant_only=False):
-    rules = { 'analyzer': 'generic', 'variants': [{'words': variants}]}
+    rules = {'analyzer': 'generic', 'variants': [{'words': variants}]}
     if variant_only:
         rules['mode'] = 'variant-only'
     trans = Transliterator.createFromRules("test_trans", DEFAULT_TRANSLITERATION)
@@ -39,11 +40,11 @@ def make_analyser(*variants, variant_only=False):
 
 def get_normalized_variants(proc, name):
     norm = Transliterator.createFromRules("test_norm", DEFAULT_NORMALIZATION)
-    return proc.compute_variants(norm.transliterate(name).strip())
+    return proc.compute_variants(norm.transliterate(name).strip())[0]
 
 
 def test_no_variants():
-    rules = { 'analyzer': 'generic' }
+    rules = {'analyzer': 'generic'}
     trans = Transliterator.createFromRules("test_trans", DEFAULT_TRANSLITERATION)
     norm = Transliterator.createFromRules("test_norm", DEFAULT_NORMALIZATION)
     config = module.configure(rules, norm, trans)
@@ -62,35 +63,36 @@ def test_variants_empty():
 
 
 VARIANT_TESTS = [
-(('~strasse,~straÃe -> str', '~weg => weg'), "hallo", {'hallo'}),
-(('weg => wg',), "holzweg", {'holzweg'}),
-(('weg -> wg',), "holzweg", {'holzweg'}),
-(('~weg => weg',), "holzweg", {'holz weg', 'holzweg'}),
-(('~weg -> weg',), "holzweg",  {'holz weg', 'holzweg'}),
-(('~weg => w',), "holzweg", {'holz w', 'holzw'}),
-(('~weg -> w',), "holzweg",  {'holz weg', 'holzweg', 'holz w', 'holzw'}),
-(('~weg => weg',), "Meier Weg", {'meier weg', 'meierweg'}),
-(('~weg -> weg',), "Meier Weg", {'meier weg', 'meierweg'}),
-(('~weg => w',), "Meier Weg", {'meier w', 'meierw'}),
-(('~weg -> w',), "Meier Weg", {'meier weg', 'meierweg', 'meier w', 'meierw'}),
-(('weg => wg',), "Meier Weg", {'meier wg'}),
-(('weg -> wg',), "Meier Weg", {'meier weg', 'meier wg'}),
-(('~strasse,~straÃe -> str', '~weg => weg'), "BauwegstraÃe",
+    (('~strasse,~straÃe -> str', '~weg => weg'), "hallo", {'hallo'}),
+    (('weg => wg',), "holzweg", {'holzweg'}),
+    (('weg -> wg',), "holzweg", {'holzweg'}),
+    (('~weg => weg',), "holzweg", {'holz weg', 'holzweg'}),
+    (('~weg -> weg',), "holzweg",  {'holz weg', 'holzweg'}),
+    (('~weg => w',), "holzweg", {'holz w', 'holzw'}),
+    (('~weg -> w',), "holzweg",  {'holz weg', 'holzweg', 'holz w', 'holzw'}),
+    (('~weg => weg',), "Meier Weg", {'meier weg', 'meierweg'}),
+    (('~weg -> weg',), "Meier Weg", {'meier weg', 'meierweg'}),
+    (('~weg => w',), "Meier Weg", {'meier w', 'meierw'}),
+    (('~weg -> w',), "Meier Weg", {'meier weg', 'meierweg', 'meier w', 'meierw'}),
+    (('weg => wg',), "Meier Weg", {'meier wg'}),
+    (('weg -> wg',), "Meier Weg", {'meier weg', 'meier wg'}),
+    (('~strasse,~straÃe -> str', '~weg => weg'), "BauwegstraÃe",
      {'bauweg straÃe', 'bauweg str', 'bauwegstraÃe', 'bauwegstr'}),
-(('am => a', 'bach => b'), "am bach", {'a b'}),
-(('am => a', '~bach => b'), "am bach", {'a b'}),
-(('am -> a', '~bach -> b'), "am bach", {'am bach', 'a bach', 'am b', 'a b'}),
-(('am -> a', '~bach -> b'), "ambach", {'ambach', 'am bach', 'amb', 'am b'}),
-(('saint -> s,st', 'street -> st'), "Saint Johns Street",
+    (('am => a', 'bach => b'), "am bach", {'a b'}),
+    (('am => a', '~bach => b'), "am bach", {'a b'}),
+    (('am -> a', '~bach -> b'), "am bach", {'am bach', 'a bach', 'am b', 'a b'}),
+    (('am -> a', '~bach -> b'), "ambach", {'ambach', 'am bach', 'amb', 'am b'}),
+    (('saint -> s,st', 'street -> st'), "Saint Johns Street",
      {'saint johns street', 's johns street', 'st johns street',
       'saint johns st', 's johns st', 'st johns st'}),
-(('river$ -> r',), "River Bend Road", {'river bend road'}),
-(('river$ -> r',), "Bent River", {'bent river', 'bent r'}),
-(('^north => n',), "North 2nd Street", {'n 2nd street'}),
-(('^north => n',), "Airport North", {'airport north'}),
-(('am -> a',), "am am am am am am am am", {'am am am am am am am am'}),
-(('am => a',), "am am am am am am am am", {'a a a a a a a a'})
-]
+    (('river$ -> r',), "River Bend Road", {'river bend road'}),
+    (('river$ -> r',), "Bent River", {'bent river', 'bent r'}),
+    (('^north => n',), "North 2nd Street", {'n 2nd street'}),
+    (('^north => n',), "Airport North", {'airport north'}),
+    (('am -> a',), "am am am am am am am am", {'am am am am am am am am'}),
+    (('am => a',), "am am am am am am am am", {'a a a a a a a a'})
+    ]
+
 
 @pytest.mark.parametrize("rules,name,variants", VARIANT_TESTS)
 def test_variants(rules, name, variants):
@@ -103,10 +105,11 @@ def test_variants(rules, name, variants):
 
 
 VARIANT_ONLY_TESTS = [
-(('weg => wg',), "hallo", set()),
-(('weg => wg',), "Meier Weg", {'meier wg'}),
-(('weg -> wg',), "Meier Weg", {'meier wg'}),
-]
+    (('weg => wg',), "hallo", set()),
+    (('weg => wg',), "Meier Weg", {'meier wg'}),
+    (('weg -> wg',), "Meier Weg", {'meier wg'}),
+    ]
+
 
 @pytest.mark.parametrize("rules,name,variants", VARIANT_ONLY_TESTS)
 def test_variants_only(rules, name, variants):
@@ -122,17 +125,15 @@ class TestGetReplacements:
 
     @staticmethod
     def configure_rules(*variants):
-        rules = { 'analyzer': 'generic', 'variants': [{'words': variants}]}
+        rules = {'analyzer': 'generic', 'variants': [{'words': variants}]}
         trans = Transliterator.createFromRules("test_trans", DEFAULT_TRANSLITERATION)
         norm = Transliterator.createFromRules("test_norm", DEFAULT_NORMALIZATION)
         return module.configure(rules, norm, trans)
 
-
     def get_replacements(self, *variants):
         config = self.configure_rules(*variants)
 
-        return sorted((k, sorted(v)) for k,v in config['replacements'])
-
+        return sorted((k, sorted(v)) for k, v in config['replacements'])
 
     @pytest.mark.parametrize("variant", ['foo > bar', 'foo -> bar -> bar',
                                          '~foo~ -> bar', 'fo~ o -> bar'])
@@ -140,38 +141,32 @@ class TestGetReplacements:
         with pytest.raises(UsageError):
             self.configure_rules(variant)
 
-
     @pytest.mark.parametrize("rule", ["!!! -> bar", "bar => !!!"])
     def test_ignore_unnormalizable_terms(self, rule):
         repl = self.get_replacements(rule)
 
         assert repl == []
 
-
     def test_add_full(self):
         repl = self.get_replacements("foo -> bar")
 
         assert repl == [(' foo ', [' bar', ' foo'])]
 
-
     def test_replace_full(self):
         repl = self.get_replacements("foo => bar")
 
         assert repl == [(' foo ', [' bar'])]
 
-
     def test_add_suffix_no_decompose(self):
         repl = self.get_replacements("~berg |-> bg")
 
         assert repl == [(' berg ', [' berg', ' bg']),
                         ('berg ', ['berg', 'bg'])]
 
-
     def test_replace_suffix_no_decompose(self):
         repl = self.get_replacements("~berg |=> bg")
 
-        assert repl == [(' berg ', [' bg']),('berg ', ['bg'])]
-
+        assert repl == [(' berg ', [' bg']), ('berg ', ['bg'])]
 
     def test_add_suffix_decompose(self):
         repl = self.get_replacements("~berg -> bg")
@@ -179,26 +174,22 @@ class TestGetReplacements:
         assert repl == [(' berg ', [' berg', ' bg', 'berg', 'bg']),
                         ('berg ', [' berg', ' bg', 'berg', 'bg'])]
 
-
     def test_replace_suffix_decompose(self):
         repl = self.get_replacements("~berg => bg")
 
         assert repl == [(' berg ', [' bg', 'bg']),
                         ('berg ', [' bg', 'bg'])]
 
-
     def test_add_prefix_no_compose(self):
         repl = self.get_replacements("hinter~ |-> hnt")
 
         assert repl == [(' hinter', [' hinter', ' hnt']),
                         (' hinter ', [' hinter', ' hnt'])]
 
-
     def test_replace_prefix_no_compose(self):
         repl = self.get_replacements("hinter~ |=> hnt")
 
-        assert repl ==  [(' hinter', [' hnt']), (' hinter ', [' hnt'])]
-
+        assert repl == [(' hinter', [' hnt']), (' hinter ', [' hnt'])]
 
     def test_add_prefix_compose(self):
         repl = self.get_replacements("hinter~-> h")
@@ -206,45 +197,38 @@ class TestGetReplacements:
         assert repl == [(' hinter', [' h', ' h ', ' hinter', ' hinter ']),
                         (' hinter ', [' h', ' h', ' hinter', ' hinter'])]
 
-
     def test_replace_prefix_compose(self):
         repl = self.get_replacements("hinter~=> h")
 
         assert repl == [(' hinter', [' h', ' h ']),
                         (' hinter ', [' h', ' h'])]
 
-
     def test_add_beginning_only(self):
         repl = self.get_replacements("^Premier -> Pr")
 
         assert repl == [('^ premier ', ['^ pr', '^ premier'])]
 
-
     def test_replace_beginning_only(self):
         repl = self.get_replacements("^Premier => Pr")
 
         assert repl == [('^ premier ', ['^ pr'])]
 
-
     def test_add_final_only(self):
         repl = self.get_replacements("road$ -> rd")
 
         assert repl == [(' road ^', [' rd ^', ' road ^'])]
 
-
     def test_replace_final_only(self):
         repl = self.get_replacements("road$ => rd")
 
         assert repl == [(' road ^', [' rd ^'])]
 
-
     def test_decompose_only(self):
         repl = self.get_replacements("~foo -> foo")
 
         assert repl == [(' foo ', [' foo', 'foo']),
                         ('foo ', [' foo', 'foo'])]
 
-
     def test_add_suffix_decompose_end_only(self):
         repl = self.get_replacements("~berg |-> bg", "~berg$ -> bg")
 
@@ -253,7 +237,6 @@ class TestGetReplacements:
                         ('berg ', ['berg', 'bg']),
                         ('berg ^', [' berg ^', ' bg ^', 'berg ^', 'bg ^'])]
 
-
     def test_replace_suffix_decompose_end_only(self):
         repl = self.get_replacements("~berg |=> bg", "~berg$ => bg")
 
@@ -262,7 +245,6 @@ class TestGetReplacements:
                         ('berg ', ['bg']),
                         ('berg ^', [' bg ^', 'bg ^'])]
 
-
     @pytest.mark.parametrize('rule', ["~berg,~burg -> bg",
                                       "~berg, ~burg -> bg",
                                       "~berg,,~burg -> bg"])
diff --git a/test/python/tokenizer/token_analysis/test_generic_mutation.py b/test/python/tokenizer/token_analysis/test_generic_mutation.py
index 7d0db925..e0507e4c 100644
--- a/test/python/tokenizer/token_analysis/test_generic_mutation.py
+++ b/test/python/tokenizer/token_analysis/test_generic_mutation.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for generic token analysis, mutation part.
@@ -24,37 +24,34 @@ DEFAULT_TRANSLITERATION = """ ::  Latin ();
                               '🜵' > ' ';
                           """
 
+
 class TestMutationNoVariants:
 
     def make_analyser(self, *mutations):
-        rules = { 'analyzer': 'generic',
-                  'mutations': [ {'pattern': m[0], 'replacements': m[1]}
-                                 for m in mutations]
-                }
+        rules = {'analyzer': 'generic',
+                 'mutations': [{'pattern': m[0], 'replacements': m[1]}
+                               for m in mutations]
+                 }
         trans = Transliterator.createFromRules("test_trans", DEFAULT_TRANSLITERATION)
         norm = Transliterator.createFromRules("test_norm", DEFAULT_NORMALIZATION)
         config = module.configure(rules, norm, trans)
 
         self.analysis = module.create(norm, trans, config)
 
-
     def variants(self, name):
         norm = Transliterator.createFromRules("test_norm", DEFAULT_NORMALIZATION)
-        return set(self.analysis.compute_variants(norm.transliterate(name).strip()))
-
+        return set(self.analysis.compute_variants(norm.transliterate(name).strip())[0])
 
     @pytest.mark.parametrize('pattern', ('(capture)', ['a list']))
     def test_bad_pattern(self, pattern):
         with pytest.raises(UsageError):
             self.make_analyser((pattern, ['b']))
 
-
     @pytest.mark.parametrize('replacements', (None, 'a string'))
     def test_bad_replacement(self, replacements):
         with pytest.raises(UsageError):
             self.make_analyser(('a', replacements))
 
-
     def test_simple_replacement(self):
         self.make_analyser(('a', ['b']))
 
@@ -62,27 +59,23 @@ class TestMutationNoVariants:
         assert self.variants('abba') == {'bbbb'}
         assert self.variants('2 aar') == {'2 bbr'}
 
-
     def test_multichar_replacement(self):
         self.make_analyser(('1 1', ['1 1 1']))
 
         assert self.variants('1 1456') == {'1 1 1456'}
         assert self.variants('1 1 1') == {'1 1 1 1'}
 
-
     def test_removement_replacement(self):
         self.make_analyser((' ', [' ', '']))
 
         assert self.variants('A 345') == {'a 345', 'a345'}
         assert self.variants('a g b') == {'a g b', 'ag b', 'a gb', 'agb'}
 
-
     def test_regex_pattern(self):
         self.make_analyser(('[^a-z]+', ['XXX', ' ']))
 
         assert self.variants('a-34n12') == {'aXXXnXXX', 'aXXXn', 'a nXXX', 'a n'}
 
-
     def test_multiple_mutations(self):
         self.make_analyser(('ä', ['ä', 'ae']), ('ö', ['ö', 'oe']))
 
diff --git a/test/python/tokenizer/token_analysis/test_simple_trie.py b/test/python/tokenizer/token_analysis/test_simple_trie.py
new file mode 100644
index 00000000..6ce66580
--- /dev/null
+++ b/test/python/tokenizer/token_analysis/test_simple_trie.py
@@ -0,0 +1,39 @@
+# SPDX-License-Identifier: GPL-3.0-or-later
+#
+# This file is part of Nominatim. (https://nominatim.org)
+#
+# Copyright (C) 2025 by the Nominatim developer community.
+# For a full list of authors see the git log.
+"""
+Tests for simplified trie structure.
+"""
+
+from nominatim_db.tokenizer.token_analysis.simple_trie import SimpleTrie
+
+
+def test_single_item_trie():
+    t = SimpleTrie([('foob', 42)])
+
+    assert t.longest_prefix('afoobar') == (None, 0)
+    assert t.longest_prefix('afoobar', start=1) == (42, 5)
+    assert t.longest_prefix('foob') == (42, 4)
+    assert t.longest_prefix('123foofoo', 3) == (None, 3)
+
+
+def test_complex_item_tree():
+    t = SimpleTrie([('a', 1),
+                    ('b', 2),
+                    ('auto', 3),
+                    ('buto', 4),
+                    ('automat', 5),
+                    ('bu', 6),
+                    ('bx', 7)])
+
+    assert t.longest_prefix('a') == (1, 1)
+    assert t.longest_prefix('au') == (1, 1)
+    assert t.longest_prefix('aut') == (1, 1)
+    assert t.longest_prefix('auto') == (3, 4)
+    assert t.longest_prefix('automat') == (5, 7)
+    assert t.longest_prefix('automatx') == (5, 7)
+    assert t.longest_prefix('butomat') == (4, 4)
+    assert t.longest_prefix('butomat', 1) == (None, 1)
diff --git a/test/python/tools/conftest.py b/test/python/tools/conftest.py
index 0098747e..dc9346c8 100644
--- a/test/python/tools/conftest.py
+++ b/test/python/tools/conftest.py
@@ -2,10 +2,11 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 import pytest
 
+
 @pytest.fixture
 def osm2pgsql_options(temp_db, tmp_path):
     """ A standard set of options for osm2pgsql
diff --git a/test/python/tools/test_add_osm_data.py b/test/python/tools/test_add_osm_data.py
index c5aaaaae..38cf87c4 100644
--- a/test/python/tools/test_add_osm_data.py
+++ b/test/python/tools/test_add_osm_data.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for functions to add additional data to the database.
@@ -13,6 +13,7 @@ import pytest
 
 from nominatim_db.tools import add_osm_data
 
+
 class CaptureGetUrl:
 
     def __init__(self, monkeypatch):
@@ -29,6 +30,7 @@ def setup_delete_postprocessing(temp_db_cursor):
     temp_db_cursor.execute("""CREATE OR REPLACE FUNCTION flush_deleted_places()
                               RETURNS INTEGER AS $$ SELECT 1 $$ LANGUAGE SQL""")
 
+
 def test_import_osm_file_simple(dsn, table_factory, osm2pgsql_options, capfd):
 
     assert add_osm_data.add_data_from_file(dsn, Path('change.osm'), osm2pgsql_options) == 0
diff --git a/test/python/tools/test_admin.py b/test/python/tools/test_admin.py
index 1e1f0e29..e758bca2 100644
--- a/test/python/tools/test_admin.py
+++ b/test/python/tools/test_admin.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for maintenance and analysis functions.
@@ -14,6 +14,7 @@ from nominatim_db.tools import admin
 from nominatim_db.tokenizer import factory
 from nominatim_db.db.sql_preprocessor import SQLPreprocessor
 
+
 @pytest.fixture(autouse=True)
 def create_placex_table(project_env, tokenizer_mock, temp_db_cursor, placex_table):
     """ All tests in this module require the placex table to be set up.
@@ -76,7 +77,8 @@ def test_analyse_indexing_with_osm_id(project_env, temp_db_cursor):
 class TestAdminCleanDeleted:
 
     @pytest.fixture(autouse=True)
-    def setup_polygon_delete(self, project_env, table_factory, place_table, osmline_table, temp_db_cursor, temp_db_conn, def_config, src_dir):
+    def setup_polygon_delete(self, project_env, table_factory, place_table,
+                             osmline_table, temp_db_cursor, temp_db_conn, def_config, src_dir):
         """ Set up place_force_delete function and related tables
         """
         self.project_env = project_env
@@ -87,12 +89,14 @@ class TestAdminCleanDeleted:
                       class TEXT NOT NULL,
                       type TEXT NOT NULL""",
                       ((100, 'N', 'boundary', 'administrative'),
-                      (145, 'N', 'boundary', 'administrative'),
-                      (175, 'R', 'landcover', 'grass')))
-        temp_db_cursor.execute("""INSERT INTO placex (place_id, osm_id, osm_type, class, type, indexed_date, indexed_status)
-                              VALUES(1, 100, 'N', 'boundary', 'administrative', current_date - INTERVAL '1 month', 1),
-                               (2, 145, 'N', 'boundary', 'administrative', current_date - INTERVAL '3 month', 1),
-                               (3, 175, 'R', 'landcover', 'grass', current_date - INTERVAL '3 months', 1)""")
+                       (145, 'N', 'boundary', 'administrative'),
+                       (175, 'R', 'landcover', 'grass')))
+        temp_db_cursor.execute("""
+            INSERT INTO placex (place_id, osm_id, osm_type, class, type,
+                                indexed_date, indexed_status)
+            VALUES(1, 100, 'N', 'boundary', 'administrative', current_date - INTERVAL '1 month', 1),
+                  (2, 145, 'N', 'boundary', 'administrative', current_date - INTERVAL '3 month', 1),
+                  (3, 175, 'R', 'landcover', 'grass', current_date - INTERVAL '3 months', 1)""")
         # set up tables and triggers for utils function
         table_factory('place_to_be_deleted',
                       """osm_id BIGINT,
@@ -116,33 +120,42 @@ class TestAdminCleanDeleted:
         sqlproc = SQLPreprocessor(temp_db_conn, def_config)
         sqlproc.run_sql_file(temp_db_conn, 'functions/utils.sql')
         def_config.lib_dir.sql = orig_sql
-        
 
     def test_admin_clean_deleted_no_records(self):
         admin.clean_deleted_relations(self.project_env, age='1 year')
-        assert self.temp_db_cursor.row_set('SELECT osm_id, osm_type, class, type, indexed_status FROM placex') == {(100, 'N', 'boundary', 'administrative', 1),
-                                                                                                                   (145, 'N', 'boundary', 'administrative', 1),
-                                                                                                                   (175, 'R', 'landcover', 'grass', 1)}
-        assert self.temp_db_cursor.table_rows('import_polygon_delete') == 3
 
+        rowset = self.temp_db_cursor.row_set(
+            'SELECT osm_id, osm_type, class, type, indexed_status FROM placex')
+
+        assert rowset == {(100, 'N', 'boundary', 'administrative', 1),
+                          (145, 'N', 'boundary', 'administrative', 1),
+                          (175, 'R', 'landcover', 'grass', 1)}
+        assert self.temp_db_cursor.table_rows('import_polygon_delete') == 3
 
     @pytest.mark.parametrize('test_age', ['T week', '1 welk', 'P1E'])
     def test_admin_clean_deleted_bad_age(self, test_age):
         with pytest.raises(UsageError):
-            admin.clean_deleted_relations(self.project_env, age = test_age)
-
+            admin.clean_deleted_relations(self.project_env, age=test_age)
 
     def test_admin_clean_deleted_partial(self):
-        admin.clean_deleted_relations(self.project_env, age = '2 months')
-        assert self.temp_db_cursor.row_set('SELECT osm_id, osm_type, class, type, indexed_status FROM placex') == {(100, 'N', 'boundary', 'administrative', 1),
-                                                                                                                   (145, 'N', 'boundary', 'administrative', 100),
-                                                                                                                   (175, 'R', 'landcover', 'grass', 100)}
+        admin.clean_deleted_relations(self.project_env, age='2 months')
+
+        rowset = self.temp_db_cursor.row_set(
+            'SELECT osm_id, osm_type, class, type, indexed_status FROM placex')
+
+        assert rowset == {(100, 'N', 'boundary', 'administrative', 1),
+                          (145, 'N', 'boundary', 'administrative', 100),
+                          (175, 'R', 'landcover', 'grass', 100)}
         assert self.temp_db_cursor.table_rows('import_polygon_delete') == 1
 
     @pytest.mark.parametrize('test_age', ['1 week', 'P3D', '5 hours'])
     def test_admin_clean_deleted(self, test_age):
-        admin.clean_deleted_relations(self.project_env, age = test_age)
-        assert self.temp_db_cursor.row_set('SELECT osm_id, osm_type, class, type, indexed_status FROM placex') == {(100, 'N', 'boundary', 'administrative', 100),
-                                                                                                                   (145, 'N', 'boundary', 'administrative', 100),
-                                                                                                                   (175, 'R', 'landcover', 'grass', 100)}
+        admin.clean_deleted_relations(self.project_env, age=test_age)
+
+        rowset = self.temp_db_cursor.row_set(
+            'SELECT osm_id, osm_type, class, type, indexed_status FROM placex')
+
+        assert rowset == {(100, 'N', 'boundary', 'administrative', 100),
+                          (145, 'N', 'boundary', 'administrative', 100),
+                          (175, 'R', 'landcover', 'grass', 100)}
         assert self.temp_db_cursor.table_rows('import_polygon_delete') == 0
diff --git a/test/python/tools/test_check_database.py b/test/python/tools/test_check_database.py
index 886bd75b..66506f56 100644
--- a/test/python/tools/test_check_database.py
+++ b/test/python/tools/test_check_database.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for database integrity checks.
@@ -12,6 +12,7 @@ import pytest
 from nominatim_db.tools import check_database as chkdb
 import nominatim_db.version
 
+
 def test_check_database_unknown_db(def_config, monkeypatch):
     monkeypatch.setenv('NOMINATIM_DATABASE_DSN', 'pgsql:dbname=fjgkhughwgh2423gsags')
     assert chkdb.check_database(def_config) == 1
@@ -35,6 +36,7 @@ def test_check_database_version_good(property_table, temp_db_conn, def_config):
                        str(nominatim_db.version.NOMINATIM_VERSION))
     assert chkdb.check_database_version(temp_db_conn, def_config) == chkdb.CheckState.OK
 
+
 def test_check_database_version_bad(property_table, temp_db_conn, def_config):
     property_table.set('database_version', '3.9.9-9')
     assert chkdb.check_database_version(temp_db_conn, def_config) == chkdb.CheckState.FATAL
diff --git a/test/python/tools/test_database_import.py b/test/python/tools/test_database_import.py
index df204298..f8cea2cc 100644
--- a/test/python/tools/test_database_import.py
+++ b/test/python/tools/test_database_import.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for functions to import a new database.
@@ -10,13 +10,14 @@ Tests for functions to import a new database.
 from pathlib import Path
 
 import pytest
-import pytest_asyncio
+import pytest_asyncio  # noqa
 import psycopg
 from psycopg import sql as pysql
 
 from nominatim_db.tools import database_import
 from nominatim_db.errors import UsageError
 
+
 class TestDatabaseSetup:
     DBNAME = 'test_nominatim_python_unittest'
 
@@ -31,18 +32,15 @@ class TestDatabaseSetup:
             with conn.cursor() as cur:
                 cur.execute(f'DROP DATABASE IF EXISTS {self.DBNAME}')
 
-
     @pytest.fixture
     def cursor(self):
         with psycopg.connect(dbname=self.DBNAME) as conn:
             with conn.cursor() as cur:
                 yield cur
 
-
     def conn(self):
         return psycopg.connect(dbname=self.DBNAME)
 
-
     def test_setup_skeleton(self):
         database_import.setup_database_skeleton(f'dbname={self.DBNAME}')
 
@@ -51,25 +49,21 @@ class TestDatabaseSetup:
             with conn.cursor() as cur:
                 cur.execute('CREATE TABLE t (h HSTORE, geom GEOMETRY(Geometry, 4326))')
 
-
     def test_unsupported_pg_version(self, monkeypatch):
         monkeypatch.setattr(database_import, 'POSTGRESQL_REQUIRED_VERSION', (100, 4))
 
         with pytest.raises(UsageError, match='PostgreSQL server is too old.'):
             database_import.setup_database_skeleton(f'dbname={self.DBNAME}')
 
-
     def test_create_db_explicit_ro_user(self):
         database_import.setup_database_skeleton(f'dbname={self.DBNAME}',
                                                 rouser='postgres')
 
-
     def test_create_db_missing_ro_user(self):
         with pytest.raises(UsageError, match='Missing read-only user.'):
             database_import.setup_database_skeleton(f'dbname={self.DBNAME}',
                                                     rouser='sdfwkjkjgdugu2;jgsafkljas;')
 
-
     def test_setup_extensions_old_postgis(self, monkeypatch):
         monkeypatch.setattr(database_import, 'POSTGIS_REQUIRED_VERSION', (50, 50))
 
@@ -173,7 +167,7 @@ def test_truncate_database_tables(temp_db_conn, temp_db_cursor, table_factory, w
 @pytest.mark.parametrize("threads", (1, 5))
 @pytest.mark.asyncio
 async def test_load_data(dsn, place_row, placex_table, osmline_table,
-                   temp_db_cursor, threads):
+                         temp_db_cursor, threads):
     for func in ('precompute_words', 'getorcreate_housenumber_id', 'make_standard_name'):
         temp_db_cursor.execute(pysql.SQL("""CREATE FUNCTION {} (src TEXT)
                                             RETURNS TEXT AS $$ SELECT 'a'::TEXT $$ LANGUAGE SQL
@@ -198,11 +192,9 @@ class TestSetupSQL:
 
         self.config = def_config
 
-
     def write_sql(self, fname, content):
         (self.config.lib_dir.sql / fname).write_text(content)
 
-
     @pytest.mark.parametrize("reverse", [True, False])
     def test_create_tables(self, temp_db_conn, temp_db_cursor, reverse):
         self.write_sql('tables.sql',
@@ -213,7 +205,6 @@ class TestSetupSQL:
 
         temp_db_cursor.scalar('SELECT test()') == reverse
 
-
     def test_create_table_triggers(self, temp_db_conn, temp_db_cursor):
         self.write_sql('table-triggers.sql',
                        """CREATE FUNCTION test() RETURNS TEXT
@@ -223,7 +214,6 @@ class TestSetupSQL:
 
         temp_db_cursor.scalar('SELECT test()') == 'a'
 
-
     def test_create_partition_tables(self, temp_db_conn, temp_db_cursor):
         self.write_sql('partition-tables.src.sql',
                        """CREATE FUNCTION test() RETURNS TEXT
@@ -233,7 +223,6 @@ class TestSetupSQL:
 
         temp_db_cursor.scalar('SELECT test()') == 'b'
 
-
     @pytest.mark.parametrize("drop", [True, False])
     @pytest.mark.asyncio
     async def test_create_search_indices(self, temp_db_conn, temp_db_cursor, drop):
diff --git a/test/python/tools/test_exec_utils.py b/test/python/tools/test_exec_utils.py
index 666ef0b8..216f1a40 100644
--- a/test/python/tools/test_exec_utils.py
+++ b/test/python/tools/test_exec_utils.py
@@ -2,19 +2,14 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for tools.exec_utils module.
 """
-from pathlib import Path
-import subprocess
-
-import pytest
-
-from nominatim_db.config import Configuration
 import nominatim_db.tools.exec_utils as exec_utils
 
+
 def test_run_osm2pgsql(osm2pgsql_options):
     osm2pgsql_options['append'] = False
     osm2pgsql_options['import_file'] = 'foo.bar'
diff --git a/test/python/tools/test_freeze.py b/test/python/tools/test_freeze.py
index f64850fb..21e49b8d 100644
--- a/test/python/tools/test_freeze.py
+++ b/test/python/tools/test_freeze.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for freeze functions (removing unused database parts).
@@ -26,6 +26,7 @@ NOMINATIM_DROP_TABLES = [
     'wikipedia_article', 'wikipedia_redirect'
 ]
 
+
 def test_drop_tables(temp_db_conn, temp_db_cursor, table_factory):
     for table in NOMINATIM_RUNTIME_TABLES + NOMINATIM_DROP_TABLES:
         table_factory(table)
@@ -42,6 +43,7 @@ def test_drop_tables(temp_db_conn, temp_db_cursor, table_factory):
 
     assert freeze.is_frozen(temp_db_conn)
 
+
 def test_drop_flatnode_file_no_file():
     freeze.drop_flatnode_file(None)
 
diff --git a/test/python/tools/test_import_special_phrases.py b/test/python/tools/test_import_special_phrases.py
index 0d33e6e0..c676c40a 100644
--- a/test/python/tools/test_import_special_phrases.py
+++ b/test/python/tools/test_import_special_phrases.py
@@ -2,20 +2,17 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
     Tests for import special phrases methods
     of the class SPImporter.
 """
-from shutil import copyfile
 import pytest
 from nominatim_db.tools.special_phrases.sp_importer import SPImporter
 from nominatim_db.tools.special_phrases.sp_wiki_loader import SPWikiLoader
 from nominatim_db.tools.special_phrases.special_phrase import SpecialPhrase
-from nominatim_db.errors import UsageError
 
-from cursor import CursorForTesting
 
 @pytest.fixture
 def sp_importer(temp_db_conn, def_config, monkeypatch):
@@ -53,6 +50,7 @@ def test_fetch_existing_place_classtype_tables(sp_importer, table_factory):
     contained_table = sp_importer.table_phrases_to_delete.pop()
     assert contained_table == 'place_classtype_testclasstypetable'
 
+
 def test_check_sanity_class(sp_importer):
     """
         Check for _check_sanity() method.
@@ -65,6 +63,7 @@ def test_check_sanity_class(sp_importer):
 
     assert sp_importer._check_sanity(SpecialPhrase('en', 'class', 'type', ''))
 
+
 def test_load_white_and_black_lists(sp_importer):
     """
         Test that _load_white_and_black_lists() well return
@@ -93,6 +92,7 @@ def test_create_place_classtype_indexes(temp_db_with_extensions,
 
     assert check_placeid_and_centroid_indexes(temp_db_cursor, phrase_class, phrase_type)
 
+
 def test_create_place_classtype_table(temp_db_conn, temp_db_cursor, placex_table, sp_importer):
     """
         Test that _create_place_classtype_table() create
@@ -105,6 +105,7 @@ def test_create_place_classtype_table(temp_db_conn, temp_db_cursor, placex_table
 
     assert check_table_exist(temp_db_cursor, phrase_class, phrase_type)
 
+
 def test_grant_access_to_web_user(temp_db_conn, temp_db_cursor, table_factory,
                                   def_config, sp_importer):
     """
@@ -120,11 +121,13 @@ def test_grant_access_to_web_user(temp_db_conn, temp_db_cursor, table_factory,
     sp_importer._grant_access_to_webuser(phrase_class, phrase_type)
     temp_db_conn.commit()
 
-    assert check_grant_access(temp_db_cursor, def_config.DATABASE_WEBUSER, phrase_class, phrase_type)
+    assert check_grant_access(temp_db_cursor, def_config.DATABASE_WEBUSER,
+                              phrase_class, phrase_type)
+
 
 def test_create_place_classtype_table_and_indexes(
         temp_db_cursor, def_config, placex_table,
-        sp_importer, temp_db_conn):
+        sp_importer, temp_db_conn, monkeypatch):
     """
         Test that _create_place_classtype_table_and_indexes()
         create the right place_classtype tables and place_id indexes
@@ -132,7 +135,8 @@ def test_create_place_classtype_table_and_indexes(
         for the given set of pairs.
     """
     pairs = set([('class1', 'type1'), ('class2', 'type2')])
-
+    for pair in pairs:
+        placex_table.add(cls=pair[0], typ=pair[1])   # adding to db
     sp_importer._create_classtype_table_and_indexes(pairs)
     temp_db_conn.commit()
 
@@ -141,6 +145,7 @@ def test_create_place_classtype_table_and_indexes(
         assert check_placeid_and_centroid_indexes(temp_db_cursor, pair[0], pair[1])
         assert check_grant_access(temp_db_cursor, def_config.DATABASE_WEBUSER, pair[0], pair[1])
 
+
 def test_remove_non_existent_tables_from_db(sp_importer, default_phrases,
                                             temp_db_conn, temp_db_cursor):
     """
@@ -168,7 +173,7 @@ def test_remove_non_existent_tables_from_db(sp_importer, default_phrases,
     temp_db_conn.commit()
 
     assert temp_db_cursor.row_set(query_tables) \
-                 == {('place_classtype_testclasstypetable_to_keep', )}
+        == {('place_classtype_testclasstypetable_to_keep', )}
 
 
 @pytest.mark.parametrize("should_replace", [(True), (False)])
@@ -182,22 +187,24 @@ def test_import_phrases(monkeypatch, temp_db_cursor, def_config, sp_importer,
         It should also update the database well by deleting or preserving existing entries
         of the database.
     """
-    #Add some data to the database before execution in order to test
-    #what is deleted and what is preserved.
+    # Add some data to the database before execution in order to test
+    # what is deleted and what is preserved.
     table_factory('place_classtype_amenity_animal_shelter')
     table_factory('place_classtype_wrongclass_wrongtype')
 
     monkeypatch.setattr('nominatim_db.tools.special_phrases.sp_wiki_loader._get_wiki_content',
                         lambda lang: xml_wiki_content)
 
+    class_test = 'aerialway'
+    type_test = 'zip_line'
+
     tokenizer = tokenizer_mock()
+    placex_table.add(cls=class_test, typ=type_test)  # in db for special phrase filtering
+    placex_table.add(cls='amenity', typ='animal_shelter')  # in db for special phrase filtering
     sp_importer.import_phrases(tokenizer, should_replace)
 
     assert len(tokenizer.analyser_cache['special_phrases']) == 18
 
-    class_test = 'aerialway'
-    type_test = 'zip_line'
-
     assert check_table_exist(temp_db_cursor, class_test, type_test)
     assert check_placeid_and_centroid_indexes(temp_db_cursor, class_test, type_test)
     assert check_grant_access(temp_db_cursor, def_config.DATABASE_WEBUSER, class_test, type_test)
@@ -209,6 +216,7 @@ def test_import_phrases(monkeypatch, temp_db_cursor, def_config, sp_importer,
     if should_replace:
         assert not temp_db_cursor.table_exists('place_classtype_wrongclass_wrongtype')
 
+
 def check_table_exist(temp_db_cursor, phrase_class, phrase_type):
     """
         Verify that the place_classtype table exists for the given
@@ -231,6 +239,7 @@ def check_grant_access(temp_db_cursor, user, phrase_class, phrase_type):
             AND privilege_type='SELECT'""".format(table_name, user))
     return temp_db_cursor.fetchone()
 
+
 def check_placeid_and_centroid_indexes(temp_db_cursor, phrase_class, phrase_type):
     """
         Check that the place_id index and centroid index exist for the
@@ -244,3 +253,38 @@ def check_placeid_and_centroid_indexes(temp_db_cursor, phrase_class, phrase_type
         and
         temp_db_cursor.index_exists(table_name, index_prefix + 'place_id')
     )
+
+
+@pytest.mark.parametrize("should_replace", [(True), (False)])
+def test_import_phrases_special_phrase_filtering(monkeypatch, temp_db_cursor, def_config,
+                                                 sp_importer, placex_table, tokenizer_mock,
+                                                 xml_wiki_content, should_replace):
+
+    monkeypatch.setattr('nominatim_db.tools.special_phrases.sp_wiki_loader._get_wiki_content',
+                        lambda lang: xml_wiki_content)
+
+    class_test = 'aerialway'
+    type_test = 'zip_line'
+
+    placex_table.add(cls=class_test, typ=type_test)  # add to the database to make valid
+    tokenizer = tokenizer_mock()
+    sp_importer.import_phrases(tokenizer, should_replace)
+
+    assert ('Zip Line', 'aerialway', 'zip_line', '-') in sp_importer.word_phrases
+    assert check_table_exist(temp_db_cursor, class_test, type_test)
+    assert check_placeid_and_centroid_indexes(temp_db_cursor, class_test, type_test)
+    assert check_grant_access(temp_db_cursor, def_config.DATABASE_WEBUSER, class_test, type_test)
+
+
+def test_get_classtype_pairs_directly(placex_table, temp_db_conn, sp_importer):
+    for _ in range(101):
+        placex_table.add(cls='highway', typ='residential')
+    for _ in range(99):
+        placex_table.add(cls='amenity', typ='toilet')
+
+    temp_db_conn.commit()
+
+    result = sp_importer.get_classtype_pairs(100)
+    print("RESULT:", result)
+    assert ('highway', 'residential') in result
+    assert ('amenity', 'toilet') not in result
diff --git a/test/python/tools/test_migration.py b/test/python/tools/test_migration.py
index 0b4d2ec6..00f6a7d7 100644
--- a/test/python/tools/test_migration.py
+++ b/test/python/tools/test_migration.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for migration functions
@@ -11,9 +11,9 @@ import pytest
 
 from nominatim_db.tools import migration
 from nominatim_db.errors import UsageError
-from nominatim_db.db.connection import server_version_tuple
 import nominatim_db.version
 
+
 class DummyTokenizer:
 
     def update_sql_functions(self, config):
@@ -49,6 +49,7 @@ def test_run_single_migration(temp_db_with_extensions, def_config, temp_db_curso
                        str(nominatim_db.version.NominatimVersion(*oldversion)))
 
     done = {'old': False, 'new': False}
+
     def _migration(**_):
         """ Dummy migration"""
         done['new'] = True
@@ -69,7 +70,7 @@ def test_run_single_migration(temp_db_with_extensions, def_config, temp_db_curso
     assert property_table.get('database_version') == str(nominatim_db.version.NOMINATIM_VERSION)
 
 
-###### Tests for specific migrations
+# Tests for specific migrations
 #
 # Each migration should come with two tests:
 #  1. Test that migration from old to new state works as expected.
diff --git a/test/python/tools/test_postcodes.py b/test/python/tools/test_postcodes.py
index f035bb19..fcf34a3b 100644
--- a/test/python/tools/test_postcodes.py
+++ b/test/python/tools/test_postcodes.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for functions to maintain the artificial postcode table.
@@ -15,6 +15,7 @@ from nominatim_db.tools import postcodes
 from nominatim_db.data import country_info
 import dummy_tokenizer
 
+
 class MockPostcodeTable:
     """ A location_postcode table for testing.
     """
@@ -35,7 +36,7 @@ class MockPostcodeTable:
                            RETURNS TEXT AS $$ BEGIN RETURN postcode; END; $$ LANGUAGE plpgsql;
 
                            CREATE OR REPLACE FUNCTION get_country_code(place geometry)
-                           RETURNS TEXT AS $$ BEGIN 
+                           RETURNS TEXT AS $$ BEGIN
                            RETURN null;
                            END; $$ LANGUAGE plpgsql;
                         """)
@@ -51,7 +52,6 @@ class MockPostcodeTable:
                         (country, postcode, x, y))
         self.conn.commit()
 
-
     @property
     def row_set(self):
         with self.conn.cursor() as cur:
@@ -63,7 +63,7 @@ class MockPostcodeTable:
 
 @pytest.fixture
 def tokenizer():
-    return dummy_tokenizer.DummyTokenizer(None, None)
+    return dummy_tokenizer.DummyTokenizer(None)
 
 
 @pytest.fixture
@@ -85,19 +85,17 @@ def insert_implicit_postcode(placex_table, place_row):
     return _insert_implicit_postcode
 
 
-def test_postcodes_empty(dsn, postcode_table, place_table,
-                         tmp_path, tokenizer):
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+def test_postcodes_empty(dsn, postcode_table, place_table, tokenizer):
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert not postcode_table.row_set
 
 
-def test_postcodes_add_new(dsn, postcode_table, tmp_path,
-                           insert_implicit_postcode, tokenizer):
+def test_postcodes_add_new(dsn, postcode_table, insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, 'xx', 'POINT(10 12)', dict(postcode='9486'))
     postcode_table.add('yy', '9486', 99, 34)
 
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert postcode_table.row_set == {('xx', '9486', 10, 12), }
 
@@ -112,49 +110,48 @@ def test_postcodes_replace_coordinates(dsn, postcode_table, tmp_path,
     assert postcode_table.row_set == {('xx', 'AB 4511', 10, 12)}
 
 
-def test_postcodes_replace_coordinates_close(dsn, postcode_table, tmp_path,
+def test_postcodes_replace_coordinates_close(dsn, postcode_table,
                                              insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, 'xx', 'POINT(10 12)', dict(postcode='AB 4511'))
     postcode_table.add('xx', 'AB 4511', 10, 11.99999)
 
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert postcode_table.row_set == {('xx', 'AB 4511', 10, 11.99999)}
 
 
-def test_postcodes_remove(dsn, postcode_table, tmp_path,
+def test_postcodes_remove(dsn, postcode_table,
                           insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, 'xx', 'POINT(10 12)', dict(postcode='AB 4511'))
     postcode_table.add('xx', 'badname', 10, 12)
 
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert postcode_table.row_set == {('xx', 'AB 4511', 10, 12)}
 
 
-def test_postcodes_ignore_empty_country(dsn, postcode_table, tmp_path,
+def test_postcodes_ignore_empty_country(dsn, postcode_table,
                                         insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, None, 'POINT(10 12)', dict(postcode='AB 4511'))
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
     assert not postcode_table.row_set
 
 
-def test_postcodes_remove_all(dsn, postcode_table, place_table,
-                              tmp_path, tokenizer):
+def test_postcodes_remove_all(dsn, postcode_table, place_table, tokenizer):
     postcode_table.add('ch', '5613', 10, 12)
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert not postcode_table.row_set
 
 
-def test_postcodes_multi_country(dsn, postcode_table, tmp_path,
+def test_postcodes_multi_country(dsn, postcode_table,
                                  insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, 'de', 'POINT(10 12)', dict(postcode='54451'))
     insert_implicit_postcode(2, 'cc', 'POINT(100 56)', dict(postcode='DD23 T'))
     insert_implicit_postcode(3, 'de', 'POINT(10.3 11.0)', dict(postcode='54452'))
     insert_implicit_postcode(4, 'cc', 'POINT(10.3 11.0)', dict(postcode='54452'))
 
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert postcode_table.row_set == {('de', '54451', 10, 12),
                                       ('de', '54452', 10.3, 11.0),
@@ -180,7 +177,7 @@ def test_postcodes_extern(dsn, postcode_table, tmp_path,
                                       ('xx', 'CD 4511', -10, -5)}
 
 
-def test_postcodes_extern_bad_column(dsn, postcode_table, tmp_path, 
+def test_postcodes_extern_bad_column(dsn, postcode_table, tmp_path,
                                      insert_implicit_postcode, tokenizer):
     insert_implicit_postcode(1, 'xx', 'POINT(10 12)', dict(postcode='AB 4511'))
 
@@ -204,35 +201,37 @@ def test_postcodes_extern_bad_number(dsn, insert_implicit_postcode,
     assert postcode_table.row_set == {('xx', 'AB 4511', 10, 12),
                                       ('xx', 'CD 4511', -10, -5)}
 
+
 def test_can_compute(dsn, table_factory):
     assert not postcodes.can_compute(dsn)
     table_factory('place')
     assert postcodes.can_compute(dsn)
 
 
-def test_no_placex_entry(dsn, tmp_path, temp_db_cursor, place_row, postcode_table, tokenizer):
-    #Rewrite the get_country_code function to verify its execution.
+def test_no_placex_entry(dsn, temp_db_cursor, place_row, postcode_table, tokenizer):
+    # Rewrite the get_country_code function to verify its execution.
     temp_db_cursor.execute("""
         CREATE OR REPLACE FUNCTION get_country_code(place geometry)
-        RETURNS TEXT AS $$ BEGIN 
+        RETURNS TEXT AS $$ BEGIN
         RETURN 'yy';
         END; $$ LANGUAGE plpgsql;
     """)
     place_row(geom='SRID=4326;POINT(10 12)', address=dict(postcode='AB 4511'))
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert postcode_table.row_set == {('yy', 'AB 4511', 10, 12)}
 
 
-def test_discard_badly_formatted_postcodes(dsn, tmp_path, temp_db_cursor, place_row, postcode_table, tokenizer):
-    #Rewrite the get_country_code function to verify its execution.
+def test_discard_badly_formatted_postcodes(dsn, temp_db_cursor, place_row,
+                                           postcode_table, tokenizer):
+    # Rewrite the get_country_code function to verify its execution.
     temp_db_cursor.execute("""
         CREATE OR REPLACE FUNCTION get_country_code(place geometry)
-        RETURNS TEXT AS $$ BEGIN 
+        RETURNS TEXT AS $$ BEGIN
         RETURN 'fr';
         END; $$ LANGUAGE plpgsql;
     """)
     place_row(geom='SRID=4326;POINT(10 12)', address=dict(postcode='AB 4511'))
-    postcodes.update_postcodes(dsn, tmp_path, tokenizer)
+    postcodes.update_postcodes(dsn, None, tokenizer)
 
     assert not postcode_table.row_set
diff --git a/test/python/tools/test_refresh.py b/test/python/tools/test_refresh.py
index 1f1968cf..95feef0d 100644
--- a/test/python/tools/test_refresh.py
+++ b/test/python/tools/test_refresh.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for various refresh functions.
@@ -12,7 +12,7 @@ from pathlib import Path
 import pytest
 
 from nominatim_db.tools import refresh
-from nominatim_db.db.connection import postgis_version_tuple
+
 
 def test_refresh_import_wikipedia_not_existing(dsn):
     assert refresh.import_wikipedia_articles(dsn, Path('.')) == 1
@@ -21,16 +21,13 @@ def test_refresh_import_wikipedia_not_existing(dsn):
 def test_refresh_import_secondary_importance_non_existing(dsn):
     assert refresh.import_secondary_importance(dsn, Path('.')) == 1
 
+
 def test_refresh_import_secondary_importance_testdb(dsn, src_dir, temp_db_conn, temp_db_cursor):
     temp_db_cursor.execute('CREATE EXTENSION postgis')
+    temp_db_cursor.execute('CREATE EXTENSION postgis_raster')
+    assert refresh.import_secondary_importance(dsn, src_dir / 'test' / 'testdb') == 0
 
-    if postgis_version_tuple(temp_db_conn)[0] < 3:
-        assert refresh.import_secondary_importance(dsn, src_dir / 'test' / 'testdb') > 0
-    else:
-        temp_db_cursor.execute('CREATE EXTENSION postgis_raster')
-        assert refresh.import_secondary_importance(dsn, src_dir / 'test' / 'testdb') == 0
-
-        assert temp_db_cursor.table_exists('secondary_importance')
+    assert temp_db_cursor.table_exists('secondary_importance')
 
 
 @pytest.mark.parametrize("replace", (True, False))
@@ -41,8 +38,7 @@ def test_refresh_import_wikipedia(dsn, src_dir, table_factory, temp_db_cursor, r
     # use the small wikipedia file for the API testdb
     assert refresh.import_wikipedia_articles(dsn, src_dir / 'test' / 'testdb') == 0
 
-    assert temp_db_cursor.table_rows('wikipedia_article') > 0
-    assert temp_db_cursor.table_rows('wikipedia_redirect') > 0
+    assert temp_db_cursor.table_rows('wikimedia_importance') > 0
 
 
 def test_recompute_importance(placex_table, table_factory, temp_db_conn, temp_db_cursor):
diff --git a/test/python/tools/test_refresh_address_levels.py b/test/python/tools/test_refresh_address_levels.py
index 6e094cdc..f2bfdea6 100644
--- a/test/python/tools/test_refresh_address_levels.py
+++ b/test/python/tools/test_refresh_address_levels.py
@@ -2,23 +2,24 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for function for importing address ranks.
 """
 import json
-from pathlib import Path
 
 import pytest
 
 from nominatim_db.tools.refresh import load_address_levels, load_address_levels_from_config
 
+
 def test_load_ranks_def_config(temp_db_conn, temp_db_cursor, def_config):
     load_address_levels_from_config(temp_db_conn, def_config)
 
     assert temp_db_cursor.table_rows('address_levels') > 0
 
+
 def test_load_ranks_from_project_dir(project_env, temp_db_conn, temp_db_cursor):
     test_file = project_env.project_dir / 'address-levels.json'
     test_file.write_text('[{"tags":{"place":{"sea":2}}}]')
@@ -43,14 +44,14 @@ def test_load_ranks_country(temp_db_conn, temp_db_cursor):
                           "tags": {"place": {"village": 15}}},
                          {"countries": ['uk', 'us'],
                           "tags": {"place": {"village": 16}}}
-                        ])
+                         ])
 
     assert temp_db_cursor.row_set('SELECT * FROM levels') == \
            set([(None, 'place', 'village', 14, 14),
                 ('de', 'place', 'village', 15, 15),
                 ('uk', 'place', 'village', 16, 16),
                 ('us', 'place', 'village', 16, 16),
-               ])
+                ])
 
 
 def test_load_ranks_default_value(temp_db_conn, temp_db_cursor):
@@ -58,33 +59,33 @@ def test_load_ranks_default_value(temp_db_conn, temp_db_cursor):
                         [{"tags": {"boundary": {"": 28}}},
                          {"countries": ['hu'],
                           "tags": {"boundary": {"": 29}}}
-                        ])
+                         ])
 
     assert temp_db_cursor.row_set('SELECT * FROM levels') == \
            set([(None, 'boundary', None, 28, 28),
                 ('hu', 'boundary', None, 29, 29),
-               ])
+                ])
 
 
 def test_load_ranks_multiple_keys(temp_db_conn, temp_db_cursor):
     load_address_levels(temp_db_conn, 'levels',
                         [{"tags": {"place": {"city": 14},
-                                   "boundary": {"administrative2" : 4}}
-                         }])
+                                   "boundary": {"administrative2": 4}}
+                          }])
 
     assert temp_db_cursor.row_set('SELECT * FROM levels') == \
            set([(None, 'place', 'city', 14, 14),
                 (None, 'boundary', 'administrative2', 4, 4),
-               ])
+                ])
 
 
 def test_load_ranks_address(temp_db_conn, temp_db_cursor):
     load_address_levels(temp_db_conn, 'levels',
                         [{"tags": {"place": {"city": 14,
-                                             "town" : [14, 13]}}
-                         }])
+                                             "town": [14, 13]}}
+                          }])
 
     assert temp_db_cursor.row_set('SELECT * FROM levels') == \
            set([(None, 'place', 'city', 14, 14),
                 (None, 'place', 'town', 14, 13),
-               ])
+                ])
diff --git a/test/python/tools/test_refresh_create_functions.py b/test/python/tools/test_refresh_create_functions.py
index 984a1610..bd8724d6 100644
--- a/test/python/tools/test_refresh_create_functions.py
+++ b/test/python/tools/test_refresh_create_functions.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for creating PL/pgSQL functions for Nominatim.
@@ -11,6 +11,7 @@ import pytest
 
 from nominatim_db.tools.refresh import create_functions
 
+
 class TestCreateFunctions:
     @pytest.fixture(autouse=True)
     def init_env(self, sql_preprocessor, temp_db_conn, def_config, tmp_path):
@@ -18,12 +19,10 @@ class TestCreateFunctions:
         self.config = def_config
         def_config.lib_dir.sql = tmp_path
 
-
     def write_functions(self, content):
         sqlfile = self.config.lib_dir.sql / 'functions.sql'
         sqlfile.write_text(content)
 
-
     def test_create_functions(self, temp_db_cursor):
         self.write_functions("""CREATE OR REPLACE FUNCTION test() RETURNS INTEGER
                               AS $$
@@ -37,7 +36,6 @@ class TestCreateFunctions:
 
         assert temp_db_cursor.scalar('SELECT test()') == 43
 
-
     @pytest.mark.parametrize("dbg,ret", ((True, 43), (False, 22)))
     def test_create_functions_with_template(self, temp_db_cursor, dbg, ret):
         self.write_functions("""CREATE OR REPLACE FUNCTION test() RETURNS INTEGER
diff --git a/test/python/tools/test_refresh_wiki_data.py b/test/python/tools/test_refresh_wiki_data.py
index 997ba04d..046e9191 100644
--- a/test/python/tools/test_refresh_wiki_data.py
+++ b/test/python/tools/test_refresh_wiki_data.py
@@ -12,7 +12,10 @@ import csv
 
 import pytest
 
-from nominatim_db.tools.refresh import import_wikipedia_articles, recompute_importance, create_functions
+from nominatim_db.tools.refresh import (import_wikipedia_articles,
+                                        recompute_importance,
+                                        create_functions)
+
 
 @pytest.fixture
 def wiki_csv(tmp_path, sql_preprocessor):
@@ -25,7 +28,7 @@ def wiki_csv(tmp_path, sql_preprocessor):
             for lang, title, importance, wd in data:
                 writer.writerow({'language': lang, 'type': 'a',
                                  'title': title, 'importance': str(importance),
-                                 'wikidata_id' : wd})
+                                 'wikidata_id': wd})
         return tmp_path
 
     return _import
diff --git a/test/python/tools/test_replication.py b/test/python/tools/test_replication.py
index 392ea075..347899bd 100644
--- a/test/python/tools/test_replication.py
+++ b/test/python/tools/test_replication.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for replication functionality.
@@ -22,13 +22,15 @@ OSM_NODE_DATA = """\
 <node id="100" visible="true" version="1" changeset="2047" timestamp="2006-01-27T22:09:10Z" user="Foo" uid="111" lat="48.7586670" lon="8.1343060">
 </node>
 </osm>
-"""
+"""  # noqa
+
 
 @pytest.fixture(autouse=True)
 def setup_status_table(status_table):
     pass
 
-### init replication
+
+# init replication
 
 def test_init_replication_bad_base_url(monkeypatch, place_row, temp_db_conn):
     place_row(osm_type='N', osm_id=100)
@@ -50,13 +52,13 @@ def test_init_replication_success(monkeypatch, place_row, temp_db_conn, temp_db_
     nominatim_db.tools.replication.init_replication(temp_db_conn, 'https://test.io')
 
     expected_date = dt.datetime.strptime('2006-01-27T19:09:10', status.ISODATE_FORMAT)\
-                        .replace(tzinfo=dt.timezone.utc)
+                      .replace(tzinfo=dt.timezone.utc)
 
     assert temp_db_cursor.row_set("SELECT * FROM import_status") \
-             == {(expected_date, 234, True)}
+        == {(expected_date, 234, True)}
 
 
-### checking for updates
+# checking for updates
 
 def test_check_for_updates_empty_status_table(temp_db_conn):
     assert nominatim_db.tools.replication.check_for_updates(temp_db_conn, 'https://test.io') == 254
@@ -87,10 +89,11 @@ def test_check_for_updates_no_new_data(monkeypatch, temp_db_conn,
                         "get_state_info",
                         lambda self: OsmosisState(server_sequence, date))
 
-    assert nominatim_db.tools.replication.check_for_updates(temp_db_conn, 'https://test.io') == result
+    assert result == \
+        nominatim_db.tools.replication.check_for_updates(temp_db_conn, 'https://test.io')
 
 
-### updating
+# updating
 
 @pytest.fixture
 def update_options(tmpdir):
@@ -100,6 +103,7 @@ def update_options(tmpdir):
                 import_file=tmpdir / 'foo.osm',
                 max_diff_size=1)
 
+
 def test_update_empty_status_table(dsn):
     with pytest.raises(UsageError):
         nominatim_db.tools.replication.update(dsn, {})
@@ -109,7 +113,7 @@ def test_update_already_indexed(temp_db_conn, dsn):
     status.set_status(temp_db_conn, dt.datetime.now(dt.timezone.utc), seq=34, indexed=False)
 
     assert nominatim_db.tools.replication.update(dsn, dict(indexed_only=True)) \
-             == nominatim_db.tools.replication.UpdateState.MORE_PENDING
+        == nominatim_db.tools.replication.UpdateState.MORE_PENDING
 
 
 def test_update_no_data_no_sleep(monkeypatch, temp_db_conn, dsn, update_options):
@@ -124,7 +128,7 @@ def test_update_no_data_no_sleep(monkeypatch, temp_db_conn, dsn, update_options)
     monkeypatch.setattr(time, 'sleep', sleeptime.append)
 
     assert nominatim_db.tools.replication.update(dsn, update_options) \
-             == nominatim_db.tools.replication.UpdateState.NO_CHANGES
+        == nominatim_db.tools.replication.UpdateState.NO_CHANGES
 
     assert not sleeptime
 
@@ -141,7 +145,7 @@ def test_update_no_data_sleep(monkeypatch, temp_db_conn, dsn, update_options):
     monkeypatch.setattr(time, 'sleep', sleeptime.append)
 
     assert nominatim_db.tools.replication.update(dsn, update_options) \
-             == nominatim_db.tools.replication.UpdateState.NO_CHANGES
+        == nominatim_db.tools.replication.UpdateState.NO_CHANGES
 
     assert len(sleeptime) == 1
     assert sleeptime[0] < 3600
diff --git a/test/python/tools/test_sp_csv_loader.py b/test/python/tools/test_sp_csv_loader.py
index 9d0ad9cc..67d6eed5 100644
--- a/test/python/tools/test_sp_csv_loader.py
+++ b/test/python/tools/test_sp_csv_loader.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
     Tests for methods of the SPCsvLoader class.
@@ -13,6 +13,7 @@ from nominatim_db.errors import UsageError
 from nominatim_db.tools.special_phrases.sp_csv_loader import SPCsvLoader
 from nominatim_db.tools.special_phrases.special_phrase import SpecialPhrase
 
+
 @pytest.fixture
 def sp_csv_loader(src_dir):
     """
diff --git a/test/python/tools/test_sp_importer.py b/test/python/tools/test_sp_importer.py
new file mode 100644
index 00000000..dda02f11
--- /dev/null
+++ b/test/python/tools/test_sp_importer.py
@@ -0,0 +1,69 @@
+from nominatim_db.tools.special_phrases.sp_importer import SPImporter
+
+
+# Testing Database Class Pair Retrieval using conftest.py and placex
+def test_get_classtype_pair_data(placex_table, def_config, temp_db_conn):
+    for _ in range(101):
+        placex_table.add(cls='highway', typ='motorway')  # edge case 101
+
+    for _ in range(99):
+        placex_table.add(cls='amenity', typ='prison')  # edge case 99
+
+    for _ in range(150):
+        placex_table.add(cls='tourism', typ='hotel')
+
+    importer = SPImporter(config=def_config, conn=temp_db_conn, sp_loader=None)
+
+    result = importer.get_classtype_pairs(min=100)
+
+    expected = {
+        ("highway", "motorway"),
+        ("tourism", "hotel")
+    }
+
+    assert result == expected, f"Expected {expected}, got {result}"
+
+
+def test_get_classtype_pair_data_more(placex_table, def_config, temp_db_conn):
+    for _ in range(100):
+        placex_table.add(cls='emergency', typ='firehydrant')  # edge case 100, not included
+
+    for _ in range(199):
+        placex_table.add(cls='amenity', typ='prison')
+
+    for _ in range(3478):
+        placex_table.add(cls='tourism', typ='hotel')
+
+    importer = SPImporter(config=def_config, conn=temp_db_conn, sp_loader=None)
+
+    result = importer.get_classtype_pairs(min=100)
+
+    expected = {
+        ("amenity", "prison"),
+        ("tourism", "hotel")
+    }
+
+    assert result == expected, f"Expected {expected}, got {result}"
+
+
+def test_get_classtype_pair_data_default(placex_table, def_config, temp_db_conn):
+    for _ in range(1):
+        placex_table.add(cls='emergency', typ='firehydrant')
+
+    for _ in range(199):
+        placex_table.add(cls='amenity', typ='prison')
+
+    for _ in range(3478):
+        placex_table.add(cls='tourism', typ='hotel')
+
+    importer = SPImporter(config=def_config, conn=temp_db_conn, sp_loader=None)
+
+    result = importer.get_classtype_pairs()
+
+    expected = {
+        ("amenity", "prison"),
+        ("tourism", "hotel"),
+        ("emergency", "firehydrant")
+    }
+
+    assert result == expected, f"Expected {expected}, got {result}"
diff --git a/test/python/tools/test_sp_wiki_loader.py b/test/python/tools/test_sp_wiki_loader.py
index 5c37c32f..b8e41cbe 100644
--- a/test/python/tools/test_sp_wiki_loader.py
+++ b/test/python/tools/test_sp_wiki_loader.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
     Tests for methods of the SPWikiLoader class.
@@ -36,22 +36,22 @@ def test_generate_phrases(sp_wiki_loader):
     """
     phrases = list(sp_wiki_loader.generate_phrases())
 
-    assert set((p.p_label, p.p_class, p.p_type, p.p_operator) for p in phrases) ==\
-              {('Zip Line', 'aerialway', 'zip_line', '-'),
-               ('Zip Lines', 'aerialway', 'zip_line', '-'),
-               ('Zip Line in', 'aerialway', 'zip_line', 'in'),
-               ('Zip Lines in', 'aerialway', 'zip_line', 'in'),
-               ('Zip Line near', 'aerialway', 'zip_line', 'near'),
-               ('Animal shelter', 'amenity', 'animal_shelter', '-'),
-               ('Animal shelters', 'amenity', 'animal_shelter', '-'),
-               ('Animal shelter in', 'amenity', 'animal_shelter', 'in'),
-               ('Animal shelters in', 'amenity', 'animal_shelter', 'in'),
-               ('Animal shelter near', 'amenity', 'animal_shelter', 'near'),
-               ('Animal shelters near', 'amenity', 'animal_shelter', 'near'),
-               ('Drinking Water near', 'amenity', 'drinking_water', 'near'),
-               ('Water', 'amenity', 'drinking_water', '-'),
-               ('Water in', 'amenity', 'drinking_water', 'in'),
-               ('Water near', 'amenity', 'drinking_water', 'near'),
-               ('Embassy', 'amenity', 'embassy', '-'),
-               ('Embassys', 'amenity', 'embassy', '-'),
-               ('Embassies', 'amenity', 'embassy', '-')}
+    assert set((p.p_label, p.p_class, p.p_type, p.p_operator) for p in phrases) == \
+        {('Zip Line', 'aerialway', 'zip_line', '-'),
+         ('Zip Lines', 'aerialway', 'zip_line', '-'),
+         ('Zip Line in', 'aerialway', 'zip_line', 'in'),
+         ('Zip Lines in', 'aerialway', 'zip_line', 'in'),
+         ('Zip Line near', 'aerialway', 'zip_line', 'near'),
+         ('Animal shelter', 'amenity', 'animal_shelter', '-'),
+         ('Animal shelters', 'amenity', 'animal_shelter', '-'),
+         ('Animal shelter in', 'amenity', 'animal_shelter', 'in'),
+         ('Animal shelters in', 'amenity', 'animal_shelter', 'in'),
+         ('Animal shelter near', 'amenity', 'animal_shelter', 'near'),
+         ('Animal shelters near', 'amenity', 'animal_shelter', 'near'),
+         ('Drinking Water near', 'amenity', 'drinking_water', 'near'),
+         ('Water', 'amenity', 'drinking_water', '-'),
+         ('Water in', 'amenity', 'drinking_water', 'in'),
+         ('Water near', 'amenity', 'drinking_water', 'near'),
+         ('Embassy', 'amenity', 'embassy', '-'),
+         ('Embassys', 'amenity', 'embassy', '-'),
+         ('Embassies', 'amenity', 'embassy', '-')}
diff --git a/test/python/tools/test_tiger_data.py b/test/python/tools/test_tiger_data.py
index 5d65fafb..f7dfe32e 100644
--- a/test/python/tools/test_tiger_data.py
+++ b/test/python/tools/test_tiger_data.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Test for tiger data function
@@ -11,12 +11,13 @@ import tarfile
 from textwrap import dedent
 
 import pytest
-import pytest_asyncio
+import pytest_asyncio  # noqa: F401
 
 from nominatim_db.db.connection import execute_scalar
 from nominatim_db.tools import tiger_data, freeze
 from nominatim_db.errors import UsageError
 
+
 class MockTigerTable:
 
     def __init__(self, conn):
@@ -40,6 +41,7 @@ class MockTigerTable:
             cur.execute("SELECT * FROM tiger LIMIT 1")
             return cur.fetchone()
 
+
 @pytest.fixture
 def tiger_table(def_config, temp_db_conn, sql_preprocessor,
                 temp_db_with_extensions, tmp_path):
@@ -87,7 +89,7 @@ async def test_add_tiger_data(def_config, src_dir, tiger_table, tokenizer_mock,
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_database_frozen(def_config, temp_db_conn, tiger_table, tokenizer_mock,
-                                 tmp_path):
+                                              tmp_path):
     freeze.drop_update_tables(temp_db_conn)
 
     with pytest.raises(UsageError) as excinfo:
@@ -100,7 +102,7 @@ async def test_add_tiger_data_database_frozen(def_config, temp_db_conn, tiger_ta
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_no_files(def_config, tiger_table, tokenizer_mock,
-                                 tmp_path):
+                                       tmp_path):
     await tiger_data.add_tiger_data(str(tmp_path), def_config, 1, tokenizer_mock())
 
     assert tiger_table.count() == 0
@@ -108,7 +110,7 @@ async def test_add_tiger_data_no_files(def_config, tiger_table, tokenizer_mock,
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_bad_file(def_config, tiger_table, tokenizer_mock,
-                                 tmp_path):
+                                       tmp_path):
     sqlfile = tmp_path / '1010.csv'
     sqlfile.write_text("""Random text""")
 
@@ -119,7 +121,7 @@ async def test_add_tiger_data_bad_file(def_config, tiger_table, tokenizer_mock,
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_hnr_nan(def_config, tiger_table, tokenizer_mock,
-                                csv_factory, tmp_path):
+                                      csv_factory, tmp_path):
     csv_factory('file1', hnr_from=99)
     csv_factory('file2', hnr_from='L12')
     csv_factory('file3', hnr_to='12.4')
@@ -133,7 +135,7 @@ async def test_add_tiger_data_hnr_nan(def_config, tiger_table, tokenizer_mock,
 @pytest.mark.parametrize("threads", (1, 5))
 @pytest.mark.asyncio
 async def test_add_tiger_data_tarfile(def_config, tiger_table, tokenizer_mock,
-                                tmp_path, src_dir, threads):
+                                      tmp_path, src_dir, threads):
     tar = tarfile.open(str(tmp_path / 'sample.tar.gz'), "w:gz")
     tar.add(str(src_dir / 'test' / 'testdb' / 'tiger' / '01001.csv'))
     tar.close()
@@ -146,7 +148,7 @@ async def test_add_tiger_data_tarfile(def_config, tiger_table, tokenizer_mock,
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_bad_tarfile(def_config, tiger_table, tokenizer_mock,
-                                    tmp_path):
+                                          tmp_path):
     tarfile = tmp_path / 'sample.tar.gz'
     tarfile.write_text("""Random text""")
 
@@ -156,7 +158,7 @@ async def test_add_tiger_data_bad_tarfile(def_config, tiger_table, tokenizer_moc
 
 @pytest.mark.asyncio
 async def test_add_tiger_data_empty_tarfile(def_config, tiger_table, tokenizer_mock,
-                                      tmp_path):
+                                            tmp_path):
     tar = tarfile.open(str(tmp_path / 'sample.tar.gz'), "w:gz")
     tar.add(__file__)
     tar.close()
diff --git a/test/python/utils/test_centroid.py b/test/python/utils/test_centroid.py
index bac0edb3..664d5cd7 100644
--- a/test/python/utils/test_centroid.py
+++ b/test/python/utils/test_centroid.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for centroid computation.
@@ -11,6 +11,7 @@ import pytest
 
 from nominatim_db.utils.centroid import PointsCentroid
 
+
 def test_empty_set():
     c = PointsCentroid()
 
@@ -18,7 +19,7 @@ def test_empty_set():
         c.centroid()
 
 
-@pytest.mark.parametrize("centroid", [(0,0), (-1, 3), [0.0000032, 88.4938]])
+@pytest.mark.parametrize("centroid", [(0, 0), (-1, 3), [0.0000032, 88.4938]])
 def test_one_point_centroid(centroid):
     c = PointsCentroid()
 
diff --git a/test/python/utils/test_json_writer.py b/test/python/utils/test_json_writer.py
index 53e3f4d3..c0946f01 100644
--- a/test/python/utils/test_json_writer.py
+++ b/test/python/utils/test_json_writer.py
@@ -2,7 +2,7 @@
 #
 # This file is part of Nominatim. (https://nominatim.org)
 #
-# Copyright (C) 2024 by the Nominatim developer community.
+# Copyright (C) 2025 by the Nominatim developer community.
 # For a full list of authors see the git log.
 """
 Tests for the streaming JSON writer.
@@ -13,6 +13,7 @@ import pytest
 
 from nominatim_api.utils.json_writer import JsonWriter
 
+
 @pytest.mark.parametrize("inval,outstr", [(None, 'null'),
                                           (True, 'true'), (False, 'false'),
                                           (23, '23'), (0, '0'), (-1.3, '-1.3'),
@@ -71,6 +72,7 @@ def test_object_single_entry():
     assert writer() == '{"something":5}'
     json.loads(writer())
 
+
 def test_object_many_values():
     writer = JsonWriter()\
                 .start_object()\
@@ -82,6 +84,7 @@ def test_object_many_values():
     assert writer() == '{"foo":null,"bar":{},"baz":"b\\taz"}'
     json.loads(writer())
 
+
 def test_object_many_values_without_none():
     writer = JsonWriter()\
                 .start_object()\
@@ -89,7 +92,7 @@ def test_object_many_values_without_none():
                     .keyval_not_none('bar', None)\
                     .keyval_not_none('baz', '')\
                     .keyval_not_none('eve', False,
-                                     transform = lambda v: 'yes' if v else 'no')\
+                                     transform=lambda v: 'yes' if v else 'no')\
                 .end_object()
 
     assert writer() == '{"foo":0,"baz":"","eve":"no"}'
diff --git a/test/testdb/wikimedia-importance.csv.gz b/test/testdb/wikimedia-importance.csv.gz
new file mode 100644
index 00000000..23f6ee69
Binary files /dev/null and b/test/testdb/wikimedia-importance.csv.gz differ
diff --git a/test/testdb/wikimedia-importance.sql.gz b/test/testdb/wikimedia-importance.sql.gz
deleted file mode 100644
index 1024f725..00000000
Binary files a/test/testdb/wikimedia-importance.sql.gz and /dev/null differ