[boundaries] Adding regex replacements for boundary names such as "Lyon 2e Arrondissement": including "Lyon" in the name is the OSM convention, but we sometimes want just "2e Arrondissement" to appear in the training data next to "Lyon".

This commit is contained in:
Al
2016-08-11 13:09:08 -04:00
parent 10a41309b8
commit 48755ec218
3 changed files with 38 additions and 3 deletions

View File

@@ -29,6 +29,12 @@ names:
- alternative: official_name # e.g. United Kingdom of Great Britain and Northern Ireland
probability: 0.01
# Per-country regex rewrites applied to boundary names.
# OSM names city districts with the city as a prefix (e.g. "Lyon 2e
# Arrondissement"); this rule sometimes keeps only the captured district part
# so that "2e Arrondissement" can appear on its own next to the city name.
regex_replacements:
  - country: fr
    # "marseilles?" accepts the French spelling "Marseille" (the form used in
    # names like "Marseille 1er Arrondissement") as well as the English
    # "Marseilles"; requiring the trailing "s" would never match the former.
    # "er?" covers both ordinal suffixes: "1er" and "2e", "3e", ...
    # NOTE(review): the pattern is all lowercase; presumably the consumer
    # matches case-insensitively or on lowercased names - confirm.
    pattern: "(?:lyon|paris|marseilles?) ([\\d]+er? arrondissement)"
    # Keep only capture group 1 (the number plus "arrondissement").
    replace_with_group: 1
    # Presumably the chance that the replacement is applied to a matching
    # name - confirm against the consumer.
    replace_probability: 0.5
# This section overrides place names
exceptions:
# Boroughs of New York City