[transliteration] For ruleset steps, the name is just the step number, which can be appended to the trie as part of the key.

This commit is contained in:
Al
2015-04-29 14:31:15 -04:00
parent 1c25238af7
commit fa43abd8d9
2 changed files with 53 additions and 53 deletions

View File

@@ -6849,78 +6849,78 @@ transliteration_rule_source_t rules_source[] = {
transliteration_step_source_t steps_source[] = {
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,0,103,NULL},
{STEP_RULESET,0,103,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,103,67,NULL},
{STEP_RULESET,170,1,NULL},
{STEP_RULESET,103,67,"1"},
{STEP_RULESET,170,1,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFKC"},
{STEP_RULESET,171,90,NULL},
{STEP_RULESET,261,47,NULL},
{STEP_RULESET,171,90,"1"},
{STEP_RULESET,261,47,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,308,88,NULL},
{STEP_RULESET,308,88,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Gujarati-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,396,82,NULL},
{STEP_RULESET,396,82,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFKD"},
{STEP_RULESET,478,107,NULL},
{STEP_RULESET,478,107,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,585,45,NULL},
{STEP_RULESET,630,76,NULL},
{STEP_RULESET,585,45,"0"},
{STEP_RULESET,630,76,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,706,95,NULL},
{STEP_RULESET,706,95,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,801,74,NULL},
{STEP_RULESET,801,74,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,875,268,NULL},
{STEP_RULESET,875,268,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Devanagari-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,1143,49,NULL},
{STEP_RULESET,1192,3,NULL},
{STEP_RULESET,1143,49,"1"},
{STEP_RULESET,1192,3,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,1195,114,NULL},
{STEP_RULESET,1195,114,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,1309,63,NULL},
{STEP_RULESET,1309,63,"1"},
{STEP_TRANSFORM,-1,-1,"Han-Spacedhan"},
{STEP_RULESET,1372,1597,NULL},
{STEP_RULESET,1372,1597,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,2969,114,NULL},
{STEP_RULESET,2969,114,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFKD"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,3083,92,NULL},
{STEP_RULESET,3083,92,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,3175,33,NULL},
{STEP_RULESET,3175,33,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,3208,298,NULL},
{STEP_RULESET,3506,342,NULL},
{STEP_RULESET,3848,83,NULL},
{STEP_RULESET,3208,298,"1"},
{STEP_RULESET,3506,342,"0"},
{STEP_RULESET,3848,83,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,3931,87,NULL},
{STEP_RULESET,3931,87,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,4018,116,NULL},
{STEP_RULESET,4018,116,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Tamil-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,4134,64,NULL},
{STEP_RULESET,4134,64,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,4198,70,NULL},
{STEP_RULESET,4198,70,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Telugu-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,4268,35,NULL},
{STEP_RULESET,4268,35,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,4303,322,NULL},
{STEP_RULESET,4625,83,NULL},
{STEP_RULESET,4303,322,"1"},
{STEP_RULESET,4625,83,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,4708,96,NULL},
{STEP_RULESET,4708,96,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Hiragana-Katakana"},
@@ -6930,7 +6930,7 @@ transliteration_step_source_t steps_source[] = {
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFKD"},
{STEP_RULESET,4804,108,NULL},
{STEP_RULESET,4804,108,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Kannada-InterIndic"},
@@ -6943,47 +6943,47 @@ transliteration_step_source_t steps_source[] = {
{STEP_TRANSFORM,-1,-1,"ThaiLogical-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,4912,97,NULL},
{STEP_RULESET,4912,97,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Oriya-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,5009,137,NULL},
{STEP_RULESET,5009,137,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,5146,101,NULL},
{STEP_RULESET,5146,101,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,5247,190,NULL},
{STEP_RULESET,5247,190,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFKD"},
{STEP_RULESET,5437,84,NULL},
{STEP_RULESET,5437,84,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Malayalam-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,5521,106,NULL},
{STEP_RULESET,5521,106,"0"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,5627,79,NULL},
{STEP_RULESET,5627,79,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_TRANSFORM,-1,-1,"Gurmukhi-InterIndic"},
{STEP_TRANSFORM,-1,-1,"InterIndic-Latin"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFD"},
{STEP_RULESET,5706,1,NULL},
{STEP_RULESET,5706,1,"1"},
{STEP_UNICODE_NORMALIZATION,-1,-1,"NFC"},
{STEP_RULESET,5707,681,NULL},
{STEP_RULESET,6388,6,NULL},
{STEP_RULESET,6394,86,NULL},
{STEP_RULESET,6480,81,NULL},
{STEP_RULESET,6561,75,NULL},
{STEP_RULESET,6636,1,NULL},
{STEP_RULESET,5707,681,"3"},
{STEP_RULESET,6388,6,"0"},
{STEP_RULESET,6394,86,"1"},
{STEP_RULESET,6480,81,"0"},
{STEP_RULESET,6561,75,"0"},
{STEP_RULESET,6636,1,"0"},
{STEP_TRANSFORM,-1,-1,"Han-Spacedhan"},
{STEP_RULESET,6637,38,NULL},
{STEP_RULESET,6675,2,NULL},
{STEP_RULESET,6637,38,"2"},
{STEP_RULESET,6675,2,"3"},
{STEP_TRANSFORM,-1,-1,"Han-Latin"},
{STEP_RULESET,6677,86,NULL},
{STEP_RULESET,6763,81,NULL}
{STEP_RULESET,6677,86,"0"},
{STEP_RULESET,6763,81,"0"}
};
transliterator_source_t transliterators_source[] = {