# Listing metadata (not part of the configuration): 88 lines, 3.1 KiB, YAML
# Name-key selection settings. Each group names a default key together with
# weighted alternative keys; within every default/alternatives group in this
# file the probabilities add up to 1.0.
#
# NOTE(review): the key names (name, short_name, alt_name, int_name,
# official_name, ISO3166-1:alpha2/alpha3) and "type: relation" look like
# OpenStreetMap tags and element types -- confirm against the consumer.
# NOTE(review): this document was restored from text whose indentation had
# been lost; the nesting of components / regex_replacements / exceptions
# under "names" is a reconstruction -- confirm against the consumer.
names:
  # General key weights (presumably used when no narrower rule below applies).
  keys:
    default: name
    probability: 0.75
    alternatives:
      - alternative: short_name  # e.g. NYC
        probability: 0.12
      - alternative: alt_name  # e.g. New York (instead of New York City)
        probability: 0.12
      - alternative: official_name  # e.g. United Kingdom of Great Britain and Northern Ireland
        probability: 0.01

  # Key weights that apply to one specific component type.
  components:
    country:
      keys:
        default: name
        probability: 0.87
        alternatives:
          # Keys containing ":" are quoted so they can only be read as strings.
          - alternative: 'ISO3166-1:alpha2'
            probability: 0.02
          - alternative: 'ISO3166-1:alpha3'
            probability: 0.01
          - alternative: short_name
            probability: 0.04
          - alternative: alt_name
            probability: 0.04
          - alternative: int_name
            probability: 0.01
          - alternative: official_name  # e.g. United Kingdom of Great Britain and Northern Ireland
            probability: 0.01

  # Per-country regex rewrites. Capture group 1 of the pattern below is the
  # "<number><suffix> arrondissement" part that follows the city name, and
  # replace_with_group selects that group.
  # NOTE(review): presumably the whole match is replaced by the group with
  # probability replace_probability -- confirm against the consumer.
  regex_replacements:
    - country: fr
      pattern: "(?:lyon|paris|marseilles?) ([\\d]+(?:e|er|ème|eme) arrondissement)"
      replace_with_group: 1
      replace_probability: 0.5

  # This section overrides place names
  exceptions:
    # Boroughs of New York City
    - id: 2552485  # New York County (don't use Manhattan)
      type: relation
      default: name  # New York County
      probability: 1.0
    - id: 369518  # Kings County (don't use Brooklyn)
      type: relation
      default: name  # Kings County
      probability: 1.0
    - id: 369519  # Queens County (don't use Queens)
      type: relation
      default: name  # Queens County
      probability: 1.0
    - id: 2552450  # Bronx County (don't use The Bronx)
      type: relation
      default: name  # Bronx County
      probability: 1.0
    - id: 962876  # Richmond County (don't use Staten Island)
      type: relation
      default: name  # Richmond County
      probability: 1.0

    # Other places
    - id: 6577227  # Kingston Parish (always use Kingston)
      type: relation
      default: name  # Kingston
      probability: 1.0
    - id: 556706  # New Zealand
      type: relation
      default: 'name:en'
      probability: 0.77
      alternatives:
        - alternative: name
          probability: 0.1
        - alternative: 'ISO3166-1:alpha2'
          probability: 0.02
        - alternative: 'ISO3166-1:alpha3'
          probability: 0.01
        - alternative: short_name
          probability: 0.04
        - alternative: alt_name
          probability: 0.04
        - alternative: int_name
          probability: 0.01
        - alternative: official_name
          probability: 0.01
    - id: 2383266  # Melbourne (city center)
      type: relation
      default: alt_name  # Melbourne
      probability: 1.0