[osm] Stripping standard city prefixes/suffixes, e.g. "Township of"

This commit is contained in:
Al
2015-12-05 15:42:22 -05:00
parent 596c5ffdd3
commit 2a4210f93f
2 changed files with 53 additions and 0 deletions

View File

@@ -0,0 +1,31 @@
from __future__ import unicode_literals
import re
from geodata.encoding import safe_decode
# Administrative designations that can precede a place name, e.g.
# "Township of Springfield". A trailing space is appended to each entry so
# the pattern only matches when the designation is followed by a space.
name_prefixes = ['{} '.format(s) for s in (
    'city of',
    'township of',
    'municipality of',
    'borough of',
    'london borough of',
    'town of',
)]

# Administrative designations that can follow a place name, e.g.
# "Springfield Township". A leading space is prepended to each entry so the
# pattern only matches when the designation is preceded by a space.
name_suffixes = [' {}'.format(s) for s in (
    'township',
    'municipality',
)]

# The alternation is wrapped in a non-capturing group so that the anchor
# applies to *every* alternative. Without the group, '^a|b|c' anchors only
# 'a' (and 'a|b|c$' anchors only 'c'), which would strip e.g. "town of "
# from the middle of "Old Town of Foo". The literals are escaped so that any
# entry containing a regex metacharacter is still matched verbatim.
name_prefix_regex = re.compile(
    '^(?:{})'.format('|'.join(re.escape(p) for p in name_prefixes)),
    re.I | re.UNICODE,
)
name_suffix_regex = re.compile(
    '(?:{})$'.format('|'.join(re.escape(p) for p in name_suffixes)),
    re.I | re.UNICODE,
)
def replace_name_prefixes(name):
    """Return ``name`` with every match of ``name_prefix_regex`` removed.

    The input is first passed through ``safe_decode`` (presumably to coerce
    byte strings to unicode -- confirm against ``geodata.encoding``); each
    regex match in the decoded text is then replaced by the empty string.
    """
    decoded = safe_decode(name)
    stripped = name_prefix_regex.sub('', decoded)
    return stripped
def replace_name_suffixes(name):
    """Return ``name`` with every match of ``name_suffix_regex`` removed.

    The input is first passed through ``safe_decode`` (presumably to coerce
    byte strings to unicode -- confirm against ``geodata.encoding``); each
    regex match in the decoded text is then replaced by the empty string.
    """
    decoded = safe_decode(name)
    stripped = name_suffix_regex.sub('', decoded)
    return stripped