From 3ff472c8cfa79ccac1ebac19635a5c1bfb40c58b Mon Sep 17 00:00:00 2001
From: Al
Date: Tue, 6 Dec 2016 22:50:14 -0500
Subject: [PATCH] [openaddresses] fixing house numbers with multiple consecutive hyphens

---
 scripts/geodata/openaddresses/formatter.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/scripts/geodata/openaddresses/formatter.py b/scripts/geodata/openaddresses/formatter.py
index 97758e84..a099ee4e 100644
--- a/scripts/geodata/openaddresses/formatter.py
+++ b/scripts/geodata/openaddresses/formatter.py
@@ -54,6 +54,8 @@ class OpenAddressesFormatter(object):
         AddressFormatter.HOUSE_NUMBER: [
             # Most of the house numbers in Montreal start with "#"
             (re.compile('^#', re.UNICODE), six.u('')),
+            # Some house numbers have multiple hyphens
+            (re.compile('[\-]{2,}'), six.u('-')),
             # Some house number ranges are split up like "12 -14"
             (re.compile('[\s]*\-[\s]*'), six.u('-')),
         ],