libpostal-sys 0.1.1

Low-level wrappers for libpostal address normalization (with locks to support thread-safe initialization)
Documentation
#ifndef GEONAMES_DICTIONARY_H
#define GEONAMES_DICTIONARY_H

#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>

#include "libpostal_config.h"
#include "geonames.h"
#include "graph.h"
#include "sparkey/sparkey.h"
#include "sparkey/sparkey-internal.h"
#include "string_utils.h"
#include "trie.h"
#include "trie_search.h"

#define GEODB_NAMES_TRIE_FILENAME "geodb_names.trie"
#define GEODB_TRIE_FILENAME_LEN strlen(GEODB_NAMES_TRIE_FILENAME)
#define GEODB_FEATURES_TRIE_FILENAME "geodb_features.trie"
#define GEODB_FEATURES_TRIE_FILENAME_LEN strlen(GEODB_FEATURES_TRIE_FILENAME)
#define GEODB_FEATURE_GRAPH_FILENAME "geodb_feature_graph.dat"
#define GEODB_FEATURE_GRAPH_FILENAME_LEN strlen(GEODB_FEATURE_GRAPH_FILENAME)
#define GEODB_POSTAL_CODES_FILENAME "geodb_postal_codes.dat"
#define GEODB_POSTAL_CODES_FILENAME_LEN strlen(GEODB_POSTAL_CODES_FILENAME)
#define GEODB_HASH_FILENAME "geodb.spi"
#define GEODB_HASH_FILENAME_LEN strlen(GEODB_HASH_FILENAME)
#define GEODB_LOG_FILENAME "geodb.spl"
#define GEODB_LOG_FILENAME_LEN strlen(GEODB_LOG_FILENAME)

// Can manipulate the bit-packed values separately, or access the whole value
typedef union geodb_value {
    uint32_t value;
    struct {
        uint32_t is_canonical:1;
        uint32_t components:15;
        uint32_t count:16;
    };
} geodb_value_t;

typedef struct geodb {
    trie_t *names;
    trie_t *features;
    cstring_array *postal_codes;
    graph_t *feature_graph;
    sparkey_hashreader *hash_reader;
    sparkey_logiter *log_iter;
    char_array *value_buf;
    geoname_t *geoname;
    gn_postal_code_t *postal_code;
} geodb_t;

typedef struct gn_geocoding_result {
    int start;
    int end;
    geonames_generic_t result;
} gn_geocoding_result_t;

geodb_t *get_geodb(void);
bool geodb_load(char *dir);

bool geodb_module_setup(char *dir);
void geodb_module_teardown(void);

void geodb_destroy(geodb_t *self);


// Trie search
bool search_geodb_with_phrases(char *str, phrase_array **phrases);
phrase_array *search_geodb(char *str);
bool search_geodb_tokens_with_phrases(char *str, token_array *tokens, phrase_array **phrases);
phrase_array *search_geodb_tokens(char *str, token_array *tokens);

geonames_generic_t *geodb_get_len(char *key, size_t len);
geonames_generic_t *geodb_get(char *key);

#endif