From 0d2e8387e66e3469b98a97d63e9d5d90be11c8ed Mon Sep 17 00:00:00 2001 From: Al Date: Tue, 31 May 2016 18:29:07 -0400 Subject: [PATCH] [openaddresses] Removing New Zealand city as the field is not specific enough and may conflict with OSM names, needs to be reverse geocoded. Adding cldr country probabilities so we can add localized names/codes given the country --- resources/dictionaries/de/place_names.txt | 1 + resources/parser/data_sets/openaddresses.yaml | 9 ++++++--- 2 files changed, 7 insertions(+), 3 deletions(-) diff --git a/resources/dictionaries/de/place_names.txt b/resources/dictionaries/de/place_names.txt index a62143ab..96ac5670 100644 --- a/resources/dictionaries/de/place_names.txt +++ b/resources/dictionaries/de/place_names.txt @@ -1,3 +1,4 @@ +abteilung|abt altersheim altstoffsammelzentrum|asz|a s z apotheke diff --git a/resources/parser/data_sets/openaddresses.yaml b/resources/parser/data_sets/openaddresses.yaml index 051c76ac..a1b0c7c1 100644 --- a/resources/parser/data_sets/openaddresses.yaml +++ b/resources/parser/data_sets/openaddresses.yaml @@ -1,5 +1,9 @@ global: - reverse_geocode: false + cldr_country_probability: 0.5 + localized_name_probability: 0.7 + iso_alpha_2_code_probability: 0.2 + iso_alpha_3_code_probability: 0.1 + abbreviate_street_probability: 0.3 separate_street_probability: 0.2 abbreviate_unit_probability: 0.3 @@ -40,8 +44,6 @@ countries: component: house_number - field_name: STREET component: road - - field_name: CITY - component: city - field_name: POSTCODE component: postcode files: @@ -55,6 +57,7 @@ countries: - filename: brussels-nl.csv us: + cldr_country_probability: 0.05 subdirs: ca: add: