[addresses] field combinations, Roman numerals and spellout for Russian config
This commit is contained in:
@@ -24,6 +24,57 @@ components:
|
|||||||
alphanumeric_probability: 0.4
|
alphanumeric_probability: 0.4
|
||||||
|
|
||||||
|
|
||||||
|
combinations:
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- staircase
|
||||||
|
- level
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "/"
|
||||||
|
probability: 0.95
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.005
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- level
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "/"
|
||||||
|
probability: 0.95
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.005
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- level
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "/"
|
||||||
|
probability: 0.95
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.01
|
||||||
|
# For unit types like 2/34
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "/"
|
||||||
|
probability: 0.95
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.005
|
||||||
|
|
||||||
|
|
||||||
numbers:
|
numbers:
|
||||||
default: &nomer
|
default: &nomer
|
||||||
canonical: номер
|
canonical: номер
|
||||||
@@ -175,10 +226,15 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
roman_numeral_probability: 0.1
|
||||||
|
spellout_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
digits:
|
digits:
|
||||||
ascii_probability: 0.8
|
ascii_probability: 0.5
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
spellout_probability: 0.2
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
@@ -192,8 +248,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
roman_numeral_probability: 0.1
|
||||||
|
spellout_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.5
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
uroven: &uroven
|
uroven: &uroven
|
||||||
@@ -204,8 +268,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
roman_numeral_probability: 0.1
|
||||||
|
spellout_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.5
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
uroven_latin: &uroven_latin
|
uroven_latin: &uroven_latin
|
||||||
@@ -216,8 +288,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
roman_numeral_probability: 0.1
|
||||||
|
spellout_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.5
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
pervyy_etazh: &pervyy_etazh
|
pervyy_etazh: &pervyy_etazh
|
||||||
@@ -267,8 +347,6 @@ levels:
|
|||||||
direction: left
|
direction: left
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
|
||||||
direction: right
|
|
||||||
number_abs_value: true
|
number_abs_value: true
|
||||||
number_min_abs_value: 2
|
number_min_abs_value: 2
|
||||||
# Basement 2 == Sub-basement 1
|
# Basement 2 == Sub-basement 1
|
||||||
@@ -290,8 +368,6 @@ levels:
|
|||||||
direction: left
|
direction: left
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
|
||||||
direction: right
|
|
||||||
number_abs_value: true
|
number_abs_value: true
|
||||||
number_min_abs_value: 2
|
number_min_abs_value: 2
|
||||||
# Basement 2 == Sub-basement 1
|
# Basement 2 == Sub-basement 1
|
||||||
@@ -345,7 +421,8 @@ levels:
|
|||||||
probability: 0.09
|
probability: 0.09
|
||||||
- alternative: *uroven_latin
|
- alternative: *uroven_latin
|
||||||
probability: 0.01
|
probability: 0.01
|
||||||
numeric_probability: 0.99 # With this probability, pick an integer
|
numeric_probability: 0.79 # With this probability, pick an integer
|
||||||
|
roman_numeral_probability: 0.2
|
||||||
alpha_probability: 0.0098 # With this probability, pick a letter e.g. A
|
alpha_probability: 0.0098 # With this probability, pick a letter e.g. A
|
||||||
numeric_plus_alpha_probability: 0.0001 # e.g. 2A
|
numeric_plus_alpha_probability: 0.0001 # e.g. 2A
|
||||||
alpha_plus_numeric_probability: 0.0001 # e.g. A2
|
alpha_plus_numeric_probability: 0.0001 # e.g. A2
|
||||||
|
|||||||
Reference in New Issue
Block a user