[tokenization/trie] Simplify the URL regex to reduce the scanner file size, account for a few more variations in word tokens, and make trie suffix search use iteration instead of malloc'ing a new string
This commit is contained in:
@@ -10,6 +10,7 @@ extern "C" {
|
||||
#include "collections.h"
|
||||
#include "klib/kvec.h"
|
||||
#include "log/log.h"
|
||||
#include "string_utils.h"
|
||||
#include "tokens.h"
|
||||
#include "vector.h"
|
||||
#include "utf8proc/utf8proc.h"
|
||||
|
||||
Reference in New Issue
Block a user