[phrases] Using safe_encode/safe_decode as default trie serializer/deserializer

This commit is contained in:
Al
2016-05-02 15:45:39 -04:00
parent 39700cbb11
commit 3c750a868e
2 changed files with 6 additions and 3 deletions

View File

@@ -1,5 +1,6 @@
import os
import sys
import ujson as json
from collections import defaultdict, OrderedDict
@@ -27,6 +28,8 @@ POSSIBLE_ROMAN_NUMERALS = set(['i', 'ii', 'iii', 'iv', 'v', 'vi', 'vii', 'viii',
class DictionaryPhraseFilter(PhraseFilter):
+serialize = safe_encode
+deserialize = safe_decode
def __init__(self, *dictionaries):
self.dictionaries = dictionaries

View File

@@ -1,8 +1,8 @@
import six
import ujson as json
from collections import *
from marisa_trie import BytesTrie
from geodata.encoding import safe_encode, safe_decode
SENTINEL = None
@@ -11,8 +11,8 @@ class PhraseFilter(object):
def __init__(self, phrases):
self.trie = [(key, self.serialize(val)) for key, val in six.iteritems(phrases)]
-serialize = json.dumps
-deserialize = json.loads
+serialize = safe_encode
+deserialize = safe_decode
def filter(self, tokens):
def return_item(item):