git.openstreetmap.org Git - nominatim.git/blob - settings/legacy_icu_tokenizer.yaml
import abbreviations from OSM Wiki
[nominatim.git] / settings / legacy_icu_tokenizer.yaml
# Normalization rules, written in ICU transform rule syntax.
# The list is ordered; later rules see the output of earlier ones.
# NOTE(review): presumably applied to names/queries before tokenization - confirm against the tokenizer code.
1 normalization:
2     - ":: lower ()"  # lowercase first, so the literal rules below only need lowercase forms
3     - !include icu-rules/unicode-digits-to-decimal.yaml  # rules pulled in from a separate file via the custom !include tag
4     - "'№' > 'no'"  # numero sign and its spelled variants all become plain "no"
5     - "'n°' > 'no'"
6     - "'nº' > 'no'"
7     - "ª > a"  # remaining ordinal indicators become plain letters
8     - "º > o"
9     - "[[:Punctuation:][:Symbol:]]  > ' '"  # punctuation and symbols become a space
10     - "ß > 'ss'" # German eszett (ß) is unambiguously equal to double s
11     - "[^[:Letter:] [:Number:] [:Space:]] >"  # drop everything that is not a letter, number or space
12     - "[:Lm:] >"  # drop modifier letters (Unicode general category Lm)
13     - ":: [[:Number:]] Latin ()"  # the next three transforms are filtered to number characters only
14     - ":: [[:Number:]] Ascii ();"
15     - ":: [[:Number:]] NFD ();"
16     - "[[:Nonspacing Mark:] [:Cf:]] >;"  # drop nonspacing marks and format characters (Cf)
17     - "[:Space:]+ > ' '"  # collapse each run of whitespace into a single space
# Transliteration rules, written in ICU transform rule syntax; order matters.
# The chain ends with lowercase text in which every non-ASCII character has been removed.
18 transliteration:
19     - ":: Latin ()"  # transliterate to Latin script
20     - !include icu-rules/extended-unicode-to-asccii.yaml  # NOTE(review): path is spelled "asccii" - confirm it matches the file on disk before changing it
21     - ":: Ascii ()"
22     - ":: NFD ()"  # decompose, so any remaining non-ASCII marks are separate characters for the next rule
23     - "[^[:Ascii:]] >"  # drop whatever is still not ASCII
24     - ":: lower ()"
25     - ":: NFC ()"  # recompose
26     - "[:Space:]+ > ' '"  # collapse each run of whitespace into a single space
# Variant rule files, one !include per file under icu-rules/.
# The file-name suffixes look like two-letter language codes and are kept in alphabetical order.
# NOTE(review): presumably per-language abbreviation/variant replacements - confirm in the included files.
27 variants:
28     - !include icu-rules/variants-bg.yaml
29     - !include icu-rules/variants-ca.yaml
30     - !include icu-rules/variants-cs.yaml
31     - !include icu-rules/variants-da.yaml
32     - !include icu-rules/variants-de.yaml
33     - !include icu-rules/variants-el.yaml
34     - !include icu-rules/variants-en.yaml
35     - !include icu-rules/variants-es.yaml
36     - !include icu-rules/variants-et.yaml
37     - !include icu-rules/variants-eu.yaml
38     - !include icu-rules/variants-fi.yaml
39     - !include icu-rules/variants-fr.yaml
40     - !include icu-rules/variants-gl.yaml
41     - !include icu-rules/variants-hu.yaml
42     - !include icu-rules/variants-it.yaml
43     - !include icu-rules/variants-ja.yaml
44     - !include icu-rules/variants-mg.yaml
45     - !include icu-rules/variants-ms.yaml
46     - !include icu-rules/variants-nl.yaml
47     - !include icu-rules/variants-no.yaml
48     - !include icu-rules/variants-pl.yaml
49     - !include icu-rules/variants-pt.yaml
50     - !include icu-rules/variants-ro.yaml
51     - !include icu-rules/variants-ru.yaml
52     - !include icu-rules/variants-sk.yaml
53     - !include icu-rules/variants-sl.yaml
54     - !include icu-rules/variants-sv.yaml
55     - !include icu-rules/variants-tr.yaml
56     - !include icu-rules/variants-uk.yaml
57     - !include icu-rules/variants-vi.yaml