From d51a1d61964b1cb8fe9d0e7c21bcf1727b6c30f8 Mon Sep 17 00:00:00 2001 From: Al Date: Fri, 21 Oct 2016 22:02:15 -0400 Subject: [PATCH] [addresses] doing hyphenation for existing components in component expansion (i.e. OSM training data) --- scripts/geodata/addresses/components.py | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/scripts/geodata/addresses/components.py b/scripts/geodata/addresses/components.py index 307e0b6f..ef0fdb08 100644 --- a/scripts/geodata/addresses/components.py +++ b/scripts/geodata/addresses/components.py @@ -1392,7 +1392,7 @@ class AddressComponents(object): def expanded(self, address_components, latitude, longitude, language=None, dropout_places=True, population=None, population_from_city=False, - add_sub_building_components=True, + add_sub_building_components=True, hyphenation=True, num_floors=None, num_basements=None, zone=None): ''' Expanded components @@ -1411,6 +1411,14 @@ class AddressComponents(object): except Exception: return None, None, None + if hyphenation: + for component in address_components: + if component in place_config.ADMIN_COMPONENTS: + value = address_components[component] + value_hyphens = self.name_hyphens(value) + if value_hyphens != value: + address_components[component] = value_hyphens + osm_components = self.osm_reverse_geocoded_components(latitude, longitude) country, candidate_languages = self.osm_country_and_languages(osm_components) if not (country and candidate_languages):