Files
libpostal/src/geodb.h

76 lines
2.2 KiB
C

#ifndef GEONAMES_DICTIONARY_H
#define GEONAMES_DICTIONARY_H
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include "libpostal_config.h"
#include "geonames.h"
#include "graph.h"
#include "sparkey/sparkey.h"
#include "sparkey/sparkey-internal.h"
#include "string_utils.h"
#include "trie.h"
#include "trie_search.h"
#define GEODB_NAMES_TRIE_FILENAME "geodb_names.trie"
#define GEODB_TRIE_FILENAME_LEN strlen(GEODB_NAMES_TRIE_FILENAME)
#define GEODB_FEATURES_TRIE_FILENAME "geodb_features.trie"
#define GEODB_FEATURES_TRIE_FILENAME_LEN strlen(GEODB_FEATURES_TRIE_FILENAME)
#define GEODB_FEATURE_GRAPH_FILENAME "geodb_feature_graph.dat"
#define GEODB_FEATURE_GRAPH_FILENAME_LEN strlen(GEODB_FEATURE_GRAPH_FILENAME)
#define GEODB_POSTAL_CODES_FILENAME "geodb_postal_codes.dat"
#define GEODB_POSTAL_CODES_FILENAME_LEN strlen(GEODB_POSTAL_CODES_FILENAME)
#define GEODB_HASH_FILENAME "geodb.spi"
#define GEODB_HASH_FILENAME_LEN strlen(GEODB_HASH_FILENAME)
#define GEODB_LOG_FILENAME "geodb.spl"
#define GEODB_LOG_FILENAME_LEN strlen(GEODB_LOG_FILENAME)
// Can manipulate the bit-packed values separately, or access the whole value
typedef union geodb_value {
uint32_t value;
struct {
uint32_t is_canonical:1;
uint32_t components:15;
uint32_t count:16;
};
} geodb_value_t;
typedef struct geodb {
trie_t *names;
trie_t *features;
cstring_array *postal_codes;
graph_t *feature_graph;
sparkey_hashreader *hash_reader;
sparkey_logiter *log_iter;
char_array *value_buf;
geoname_t *geoname;
gn_postal_code_t *postal_code;
} geodb_t;
typedef struct gn_geocoding_result {
int start;
int end;
geonames_generic_t result;
} gn_geocoding_result_t;
geodb_t *get_geodb(void);
bool geodb_load(char *dir);
bool geodb_module_setup(char *dir);
void geodb_module_teardown(void);
void geodb_destroy(geodb_t *self);
// Trie search
bool search_geodb_with_phrases(char *str, phrase_array **phrases);
phrase_array *search_geodb(char *str);
bool search_geodb_tokens_with_phrases(char *str, token_array *tokens, phrase_array **phrases);
phrase_array *search_geodb_tokens(char *str, token_array *tokens);
geonames_generic_t *geodb_get_len(char *key, size_t len);
geonames_generic_t *geodb_get(char *key);
#endif