Files
libpostal/src/address_dictionary.h

84 lines
2.8 KiB
C

#ifndef ADDRESS_DICTIONARY_H
#define ADDRESS_DICTIONARY_H
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include <stdbool.h>
#include <string.h>
#include "address_expansion_rule.h"
#include "libpostal_config.h"
#include "constants.h"
#include "collections.h"
#include "file_utils.h"
#include "gazetteers.h"
#include "trie.h"
#include "trie_search.h"
#define ALL_LANGUAGES "all"
#define DEFAULT_ADDRESS_EXPANSION_PATH LIBPOSTAL_DATA_DIR PATH_SEPARATOR "address_expansions" PATH_SEPARATOR "address_dictionary.dat"
#define NULL_CANONICAL_INDEX -1
typedef struct address_expansion {
int32_t canonical_index;
char language[MAX_LANGUAGE_LEN];
uint32_t num_dictionaries;
uint16_t dictionary_ids[MAX_DICTIONARY_TYPES];
uint32_t address_components;
bool separable;
} address_expansion_t;
VECTOR_INIT(address_expansion_array, address_expansion_t)
typedef struct address_expansion_value {
uint32_t components;
address_expansion_array *expansions;
} address_expansion_value_t;
address_expansion_value_t *address_expansion_value_new(void);
address_expansion_value_t *address_expansion_value_new_with_expansion(address_expansion_t expansion);
void address_expansion_value_destroy(address_expansion_value_t *self);
VECTOR_INIT_FREE_DATA(address_expansion_value_array, address_expansion_value_t *, address_expansion_value_destroy)
typedef struct address_dictionary {
cstring_array *canonical;
address_expansion_value_array *values;
trie_t *trie;
} address_dictionary_t;
address_dictionary_t *get_address_dictionary(void);
bool address_dictionary_init(void);
phrase_array *search_address_dictionaries(char *str, char *lang);
bool search_address_dictionaries_with_phrases(char *str, char *lang, phrase_array **phrases);
phrase_array *search_address_dictionaries_tokens(char *str, token_array *tokens, char *lang);
bool search_address_dictionaries_tokens_with_phrases(char *str, token_array *tokens, char *lang, phrase_array **phrases);
phrase_t search_address_dictionaries_prefix(char *str, size_t len, char *lang);
phrase_t search_address_dictionaries_suffix(char *str, size_t len, char *lang);
address_expansion_value_t *address_dictionary_get_expansions(uint32_t i);
bool address_expansion_in_dictionary(address_expansion_t expansion, uint16_t dictionary_id);
char *address_dictionary_get_canonical(uint32_t index);
int32_t address_dictionary_next_canonical_index(void);
bool address_dictionary_add_canonical(char *canonical);
bool address_dictionary_add_expansion(char *key, char *language, address_expansion_t expansion);
void address_dictionary_destroy(address_dictionary_t *self);
bool address_dictionary_load(char *path);
bool address_dictionary_save(char *path);
bool address_dictionary_module_setup(char *filename);
void address_dictionary_module_teardown(void);
#endif