[fix] using new pypostal tokenize API
This commit is contained in:
@@ -197,7 +197,7 @@ def disambiguate_language(text, languages):
|
|||||||
read_len += script_len
|
read_len += script_len
|
||||||
|
|
||||||
num_defaults = sum((1 for lang, default in valid_languages.iteritems() if default))
|
num_defaults = sum((1 for lang, default in valid_languages.iteritems() if default))
|
||||||
tokens = [(c, t.rstrip('.')) for c, t in tokenize(safe_decode(text).replace(u'-', u' ').lower())]
|
tokens = [(c, t.rstrip('.')) for t, c in tokenize(safe_decode(text).replace(u'-', u' ').lower())]
|
||||||
|
|
||||||
current_lang = None
|
current_lang = None
|
||||||
possible_lang = None
|
possible_lang = None
|
||||||
|
|||||||
Reference in New Issue
Block a user