[tokenization] Adding URL, email, US/international phone numbers, a separate type for ideographic numbers, more general quotes, paren types

This commit is contained in:
Al
2015-03-24 16:43:53 -04:00
parent 50187f28ce
commit 2d1c24a6e9
4 changed files with 298633 additions and 262454 deletions

View File

@@ -12,11 +12,11 @@ typedef struct scanner {
unsigned char *src, *cursor, *start, *end;
} scanner_t;
int scan_token(scanner_t *s);
uint16_t scan_token(scanner_t *s);
inline scanner_t scanner_from_string(const char *input);
tokenized_string_t *tokenize(const char *str);
token_array *tokenize(const char *input);
#ifdef __cplusplus