[fix] IDEOGRAM class name
This commit is contained in:
@@ -12,6 +12,8 @@ extern "C" {
|
||||
// Word types
|
||||
#define WORD 1 // Any letter-only word (includes all unicode letters)
|
||||
#define ABBREVIATION 2 // Loose abbreviations (ending in ".")
|
||||
#define IDEOGRAM 3 // For languages that don't separate on whitespace (e.g. Chinese, Japanese, Korean), separate by character
|
||||
#define PHRASE 4 // Not part of the first stage tokenizer, but may be used after phrase parsing
|
||||
|
||||
// Numbers and numeric types
|
||||
#define NUMBER 50 // All digits
|
||||
|
||||
Reference in New Issue
Block a user