1 # SPDX-License-Identifier: GPL-2.0-only
3 # This file is part of Nominatim. (https://nominatim.org)
5 # Copyright (C) 2022 by the Nominatim developer community.
6 # For a full list of authors see the git log.
8 Nominatim configuration accessor.
10 from typing import Dict, Any, List, Mapping, Optional
15 from pathlib import Path
19 from dotenv import dotenv_values
20 from psycopg2.extensions import parse_dsn
22 from nominatim.typing import StrPath
23 from nominatim.errors import UsageError
24 import nominatim.paths
# Logger used by this module to report fatal configuration errors.
LOG = logging.getLogger()
# Cache of already parsed sub-configuration files, keyed by the string
# form of the configuration file path.
CONFIG_CACHE: Dict[str, Any] = {}
def flatten_config_list(content: Any, section: str = '') -> List[Any]:
    """ Flatten YAML configuration lists that contain include sections
        which are lists themselves.

        `content` is the parsed configuration value and `section` the name
        of the section it was taken from (only used in the error message).
        Nested lists are expanded recursively at the position where they
        appear, all other elements are copied unchanged. Empty content
        results in an empty list.

        Raises a UsageError when non-empty content is not a list.
    """
    if not content:
        return []

    if not isinstance(content, list):
        raise UsageError(f"List expected in section '{section}'.")

    output: List[Any] = []
    for ele in content:
        if isinstance(ele, list):
            output.extend(flatten_config_list(ele, section))
        else:
            output.append(ele)

    return output
50 """ Load and manage the project configuration.
52 Nominatim uses dotenv to configure the software. Configuration options
53 are resolved in the following order:
55 * from the OS environment (or the dictionary given in `environ`)
56 * from the .env file in the project directory of the installation
57 * from the default installation in the configuration directory
59 All Nominatim configuration options are prefixed with 'NOMINATIM_' to
60 avoid conflicts with other environment variables.
def __init__(self, project_dir: Optional[Path],
             environ: Optional[Mapping[str, str]] = None) -> None:
    """ Set up the configuration for the given project directory.

        Defaults are read from 'env.defaults' in the configuration
        directory. When `project_dir` is given and contains a '.env'
        file, the project directory is resolved to an absolute path and
        the settings of that file are layered over the defaults.

        `environ` replaces the OS environment as the source of overriding
        settings. Note that a falsy value (None or an empty mapping)
        selects the OS environment.
    """
    self.environ = environ or os.environ
    self.project_dir = project_dir
    self.config_dir = nominatim.paths.CONFIG_DIR
    self._config = dotenv_values(str(self.config_dir / 'env.defaults'))
    if self.project_dir is not None and (self.project_dir / '.env').is_file():
        self.project_dir = self.project_dir.resolve()
        self._config.update(dotenv_values(str(self.project_dir / '.env')))

    # Simple namespace for library paths. Further entries may be added
    # or replaced through set_libdirs().
    class _LibDirs:
        php = nominatim.paths.PHPLIB_DIR
        sql = nominatim.paths.SQLLIB_DIR
        data = nominatim.paths.DATA_DIR

    self.lib_dir = _LibDirs()
    # Plugin modules loaded from files, keyed by the name they were requested with.
    self._private_plugins: Dict[str, object] = {}
def set_libdirs(self, **kwargs: StrPath) -> None:
    """ Set paths to library functions and data.

        Each keyword argument becomes an attribute of `self.lib_dir` with
        the given value converted to a Path.
    """
    for key, value in kwargs.items():
        setattr(self.lib_dir, key, Path(value))
def __getattr__(self, name: str) -> str:
    """ Return the value of the configuration option `name`, which must
        be given without the 'NOMINATIM_' prefix.

        A value from the environment mapping takes precedence over the
        value from the loaded configuration files. Options that are
        configured without a value are returned as an empty string.

        Raises a KeyError when the option is unknown and an AttributeError
        for internal or special attribute names.
    """
    # This hook only runs when normal attribute lookup has failed. If the
    # internal state itself is missing (e.g. on an instance that was
    # created without __init__) or Python probes for a special method,
    # fail properly instead of recursing endlessly through self.environ.
    if name in ('environ', '_config') \
       or (name.startswith('__') and name.endswith('__')):
        raise AttributeError(name)

    name = 'NOMINATIM_' + name

    if name in self.environ:
        return self.environ[name]

    return self._config[name] or ''
def get_bool(self, name: str) -> bool:
    """ Return the given configuration parameter as a boolean.
        Values of '1', 'yes' and 'true' are accepted as truthy values,
        everything else is interpreted as false. The comparison is
        case-insensitive.
    """
    return getattr(self, name).lower() in ('1', 'yes', 'true')
def get_int(self, name: str) -> int:
    """ Return the given configuration parameter as an int.

        Raises a UsageError when the configured value cannot be
        converted to an integer.
    """
    try:
        return int(getattr(self, name))
    except ValueError as exp:
        LOG.fatal("Invalid setting NOMINATIM_%s. Needs to be a number.", name)
        raise UsageError("Configuration error.") from exp
def get_str_list(self, name: str) -> Optional[List[str]]:
    """ Return the given configuration parameter as a list of strings.
        The values are assumed to be given as a comma-separated list and
        will be stripped before returning them. On empty values None
        is returned.
    """
    raw = getattr(self, name)

    return [v.strip() for v in raw.split(',')] if raw else None
def get_path(self, name: str) -> Optional[Path]:
    """ Return the given configuration parameter as a Path.
        If a relative path is configured, then the function converts this
        into an absolute path with the project directory as root path.
        If the configuration is unset, None is returned.
    """
    value = getattr(self, name)
    if not value:
        return None

    cfgpath = Path(value)

    if not cfgpath.is_absolute():
        # Relative paths can only be interpreted with a project directory.
        assert self.project_dir is not None
        cfgpath = self.project_dir / cfgpath

    return cfgpath.resolve()
def get_libpq_dsn(self) -> str:
    """ Get configured database DSN converted into the key/value format
        understood by libpq and psycopg.

        A DSN in the old PHP format ('pgsql:key=value;key=value') is
        converted into space-separated 'key=value' pairs. Any other
        DSN is returned unchanged.
    """
    dsn = self.DATABASE_DSN

    def quote_param(param: str) -> str:
        # Split at the first '=' only, the value itself may contain '='.
        key, val = param.split('=', 1)
        val = val.replace('\\', '\\\\').replace("'", "\\'")
        # libpq requires quotes around empty values and values with spaces.
        if not val or ' ' in val:
            val = "'" + val + "'"
        return key + '=' + val

    if dsn.startswith('pgsql:'):
        # Old PHP DSN format. Convert before returning.
        return ' '.join([quote_param(p) for p in dsn[6:].split(';')])

    return dsn
def get_database_params(self) -> Mapping[str, str]:
    """ Get the configured parameters for the database connection
        as a mapping from parameter name to value.

        A DSN in the old PHP format ('pgsql:key=value;key=value') is
        split directly, any other DSN is handed to psycopg's parse_dsn().
    """
    dsn = self.DATABASE_DSN

    if dsn.startswith('pgsql:'):
        # Split at the first '=' only, the value itself may contain '='.
        return dict(p.split('=', 1) for p in dsn[6:].split(';'))

    return parse_dsn(dsn)
def get_import_style_file(self) -> Path:
    """ Return the import style file as a path object. Translates the
        name of the standard styles automatically into a file in the
        configuration directory. Any other value of IMPORT_STYLE is
        resolved with find_config_file().
    """
    style = getattr(self, 'IMPORT_STYLE')

    if style in ('admin', 'street', 'address', 'full', 'extratags'):
        return self.config_dir / f'import-{style}.lua'

    return self.find_config_file('', 'IMPORT_STYLE')
def get_os_env(self) -> Dict[str, str]:
    """ Return a copy of the OS environment with the Nominatim configuration
        merged in.

        Settings from the configuration files that have no value are left
        out. Entries of the environment mapping take precedence over
        settings from the configuration files.
    """
    env = {k: v for k, v in self._config.items() if v is not None}
    env.update(self.environ)

    return env
def load_sub_configuration(self, filename: StrPath,
                           config: Optional[str] = None) -> Any:
    """ Load additional configuration from a file. `filename` is the name
        of the configuration file. The file is first searched in the
        project directory and then in the global settings directory.

        If `config` is set, then the name of the configuration file can
        be additionally given through a .env configuration option. When
        the option is set, then the file will be exclusively loaded as set:
        if the name is an absolute path, the file name is taken as is,
        if the name is relative, it is searched in the same directories
        as `filename`.

        The format of the file is determined from the filename suffix.
        Files with the extensions '.yaml', '.yml' and '.json' are
        supported, any other suffix raises a UsageError.

        YAML files support a special '!include' construct. When the
        directive is given, the value is taken to be a filename, the file
        is located in the same way, parsed as YAML and added at the
        position of the directive.

        Parsed files are cached by their path, so a repeated request
        returns the same object as the first one.
    """
    configfile = self.find_config_file(filename, config)
    cache_key = str(configfile)

    if cache_key in CONFIG_CACHE:
        return CONFIG_CACHE[cache_key]

    if configfile.suffix in ('.yaml', '.yml'):
        result = self._load_from_yaml(configfile)
    elif configfile.suffix == '.json':
        with configfile.open('r', encoding='utf-8') as cfg:
            result = json.load(cfg)
    else:
        raise UsageError(f"Config file '{configfile}' has unknown format.")

    CONFIG_CACHE[cache_key] = result
    return result
def load_plugin_module(self, module_name: str, internal_path: str) -> Any:
    """ Load a Python module as a plugin.

        The module_name may have three variants:

        * A name without any '.' is assumed to be an internal module
          and will be searched relative to `internal_path`. Dashes in
          the name are replaced with underscores.
        * If the name ends in `.py`, module_name is assumed to be a
          file name relative to the project directory.
        * Any other name is assumed to be an absolute module name.

        In either of the variants the first character of the module name
        must be valid as a Python identifier, otherwise a UsageError is
        raised. A UsageError is also raised when a `.py` file cannot be
        found in the project directory.
    """
    if not module_name or not module_name[0].isidentifier():
        raise UsageError(f'Invalid module name {module_name}')

    if '.' not in module_name:
        module_name = module_name.replace('-', '_')
        full_module = f'{internal_path}.{module_name}'
        return sys.modules.get(full_module) or importlib.import_module(full_module)

    if module_name.endswith('.py'):
        if self.project_dir is None or not (self.project_dir / module_name).exists():
            raise UsageError(f"Cannot find module '{module_name}' in project directory.")

        if module_name in self._private_plugins:
            return self._private_plugins[module_name]

        file_path = str(self.project_dir / module_name)
        spec = importlib.util.spec_from_file_location(module_name, file_path)
        if spec:
            assert spec.loader is not None
            module = importlib.util.module_from_spec(spec)
            # Do not add to global modules because there is no standard
            # module name that Python can resolve.
            self._private_plugins[module_name] = module
            try:
                spec.loader.exec_module(module)
            except BaseException:
                # Never hand out a half-initialised module on a later call.
                self._private_plugins.pop(module_name, None)
                raise

            return module

    return sys.modules.get(module_name) or importlib.import_module(module_name)
def find_config_file(self, filename: StrPath,
                     config: Optional[str] = None) -> Path:
    """ Resolve the location of a configuration file given a filename and
        an optional configuration option with the file name.

        When `config` names a configuration option with a non-empty
        value, that value replaces `filename`. An absolute value is
        resolved and returned directly. Any other name is searched first
        in the project directory and then in the configuration directory.

        Raises a UsageError when the file cannot be found or is not
        a regular file.
    """
    if config is not None:
        cfg_value = getattr(self, config)
        if cfg_value:
            cfg_filename = Path(cfg_value)

            if cfg_filename.is_absolute():
                cfg_filename = cfg_filename.resolve()

                if not cfg_filename.is_file():
                    LOG.fatal("Cannot find config file '%s'.", cfg_filename)
                    raise UsageError("Config file not found.")

                return cfg_filename

            filename = cfg_filename

    search_paths = [self.project_dir, self.config_dir]
    for path in search_paths:
        # The project directory is optional and may be unset.
        if path is not None and (path / filename).is_file():
            return path / filename

    LOG.fatal("Configuration file '%s' not found.\nDirectories searched: %s",
              filename, search_paths)
    raise UsageError("Config file not found.")
def _load_from_yaml(self, cfgfile: Path) -> Any:
    """ Load a YAML configuration file. This installs a special handler that
        allows to include other YAML files using the '!include' operator.

        The file is read as UTF-8 and the parsed content is returned.
    """
    # The constructor is registered on yaml.SafeLoader itself, so it is
    # also in effect for the yaml.safe_load() call below.
    yaml.add_constructor('!include', self._yaml_include_representer,
                         Loader=yaml.SafeLoader)
    return yaml.safe_load(cfgfile.read_text(encoding='utf-8'))
def _yaml_include_representer(self, loader: Any, node: yaml.Node) -> Any:
    """ Handler for the '!include' operator in YAML files.

        The scalar value of the node is taken as the name of the file to
        include. An absolute filename is used as is. When the filename is
        relative, then the file is first searched in the project directory
        and then in the global settings directory.

        Returns the parsed content of the included file. Raises a
        UsageError when the file does not have a YAML file extension
        ('.yaml' or '.yml').
    """
    fname = loader.construct_scalar(node)

    if Path(fname).is_absolute():
        configfile = Path(fname)
    else:
        configfile = self.find_config_file(fname)

    # Accept the same YAML suffixes as load_sub_configuration().
    if configfile.suffix not in ('.yaml', '.yml'):
        LOG.fatal("Format error while reading '%s': only YAML format supported.",
                  configfile)
        raise UsageError("Cannot handle config file format.")

    return yaml.safe_load(configfile.read_text(encoding='utf-8'))