[addresses] Adding digit spellout and the list form of field combinations to existing configs
This commit is contained in:
@@ -100,12 +100,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.7
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
|
roman_numeral_probability: 0.7
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
@@ -120,10 +124,14 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
etaz: &etaz
|
etaz: &etaz
|
||||||
@@ -134,10 +142,14 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
prizemi: &prizemi
|
prizemi: &prizemi
|
||||||
@@ -163,7 +175,9 @@ levels:
|
|||||||
# e.g. 1. podzemní podlaží
|
# e.g. 1. podzemní podlaží
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
standalone_probability: 0.985
|
standalone_probability: 0.985
|
||||||
number_abs_value: true
|
number_abs_value: true
|
||||||
number_min_abs_value: 1
|
number_min_abs_value: 1
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ components:
|
|||||||
alphanumeric_probability: 0.25
|
alphanumeric_probability: 0.25
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
level_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- level
|
- level
|
||||||
- unit
|
- unit
|
||||||
@@ -32,7 +32,7 @@ components:
|
|||||||
- separator: " - "
|
- separator: " - "
|
||||||
probability: 0.1
|
probability: 0.1
|
||||||
probability: 0.005
|
probability: 0.005
|
||||||
entrance_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- entrance
|
- entrance
|
||||||
- unit
|
- unit
|
||||||
@@ -121,6 +121,9 @@ levels:
|
|||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
etage: &etage
|
etage: &etage
|
||||||
@@ -132,6 +135,9 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
stuen: &stuen
|
stuen: &stuen
|
||||||
|
|||||||
@@ -26,7 +26,7 @@ components:
|
|||||||
combinations:
|
combinations:
|
||||||
# e.g. 2/34, more common way to specify a unit number in German
|
# e.g. 2/34, more common way to specify a unit number in German
|
||||||
# if unit exists in the first place
|
# if unit exists in the first place
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -117,6 +117,9 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.3
|
numeric_probability: 0.3
|
||||||
numeric_affix_probability: 0.5
|
numeric_affix_probability: 0.5
|
||||||
ordinal_probability: 0.2
|
ordinal_probability: 0.2
|
||||||
@@ -129,6 +132,9 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
stock: &stock
|
stock: &stock
|
||||||
@@ -140,6 +146,9 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.1
|
numeric_probability: 0.1
|
||||||
ordinal_probability: 0.9
|
ordinal_probability: 0.9
|
||||||
erdgeschoss: &erdgeschoss
|
erdgeschoss: &erdgeschoss
|
||||||
@@ -613,29 +622,8 @@ countries:
|
|||||||
|
|
||||||
# Combined apartment numbers are very common
|
# Combined apartment numbers are very common
|
||||||
combinations:
|
combinations:
|
||||||
# e.g. Neubaugasse 55/5
|
|
||||||
house_number_unit:
|
|
||||||
probability: 0.7
|
|
||||||
separators:
|
|
||||||
- separator: /
|
|
||||||
probability: 0.98
|
|
||||||
- separator: "-"
|
|
||||||
probability: 0.02
|
|
||||||
# e.g. Neubaugasse 55/1/5
|
|
||||||
house_number_staircase_unit:
|
|
||||||
components:
|
|
||||||
- house_number
|
|
||||||
- staircase
|
|
||||||
- unit
|
|
||||||
label: house_number
|
|
||||||
separators:
|
|
||||||
- separator: /
|
|
||||||
probability: 0.98
|
|
||||||
- separator: "-"
|
|
||||||
probability: 0.02
|
|
||||||
probability: 0.8
|
|
||||||
# e.g. Neubaugasse 55/A/1/5
|
# e.g. Neubaugasse 55/A/1/5
|
||||||
house_number_entrance_staircase_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- entrance
|
- entrance
|
||||||
@@ -648,6 +636,31 @@ countries:
|
|||||||
- separator: "-"
|
- separator: "-"
|
||||||
probability: 0.02
|
probability: 0.02
|
||||||
probability: 0.9
|
probability: 0.9
|
||||||
|
# e.g. Neubaugasse 55/1/5
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- staircase
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: /
|
||||||
|
probability: 0.98
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.02
|
||||||
|
probability: 0.8
|
||||||
|
# e.g. Neubaugasse 55/5
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
probability: 0.7
|
||||||
|
separators:
|
||||||
|
- separator: /
|
||||||
|
probability: 0.98
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.02
|
||||||
|
|
||||||
units:
|
units:
|
||||||
top: &top
|
top: &top
|
||||||
|
|||||||
@@ -65,7 +65,7 @@ components:
|
|||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
# For unit types like 2/34 (more common in Canada and Australia)
|
# For unit types like 2/34 (more common in Canada and Australia)
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -160,9 +160,12 @@ levels:
|
|||||||
numeric_affix:
|
numeric_affix:
|
||||||
affix: /f
|
affix: /f
|
||||||
direction: right # affix goes to number's right (always)
|
direction: right # affix goes to number's right (always)
|
||||||
# e.g. 1st Floor
|
# e.g. 1st Floor
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right # canonical or abbreviated form goes to the ordinal's right
|
direction: right # canonical or abbreviated form goes to the ordinal's right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
# Probabilities
|
# Probabilities
|
||||||
numeric_probability: 0.75 # Use the simple number e.g. Floor 1 (or Floor No. 1)
|
numeric_probability: 0.75 # Use the simple number e.g. Floor 1 (or Floor No. 1)
|
||||||
numeric_affix_probability: 0.05 # Use the 2/F (less common)
|
numeric_affix_probability: 0.05 # Use the 2/F (less common)
|
||||||
@@ -1356,9 +1359,7 @@ countries:
|
|||||||
ca:
|
ca:
|
||||||
components:
|
components:
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
probability: 0.0
|
|
||||||
unit_house_number:
|
|
||||||
components:
|
components:
|
||||||
- unit
|
- unit
|
||||||
- house_number
|
- house_number
|
||||||
|
|||||||
@@ -108,6 +108,9 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
direction_probability: 0.95 # Let it vary occasionally e.g. Piso 2o
|
direction_probability: 0.95 # Let it vary occasionally e.g. Piso 2o
|
||||||
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.6
|
numeric_probability: 0.6
|
||||||
numeric_affix_probability: 0.05
|
numeric_affix_probability: 0.05
|
||||||
ordinal_probability: 0.35
|
ordinal_probability: 0.35
|
||||||
@@ -954,6 +957,9 @@ countries:
|
|||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
gender: f
|
gender: f
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
canonical_probability: 0.6
|
canonical_probability: 0.6
|
||||||
abbreviated_probability: 0.2
|
abbreviated_probability: 0.2
|
||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ components:
|
|||||||
alphanumeric_probability: 0.25
|
alphanumeric_probability: 0.25
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ components:
|
|||||||
alphanumeric_probability: 0.25
|
alphanumeric_probability: 0.25
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
staircase_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- staircase
|
- staircase
|
||||||
- unit
|
- unit
|
||||||
@@ -107,6 +107,9 @@ levels:
|
|||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
|
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ components:
|
|||||||
alphanumeric_probability: 0.2
|
alphanumeric_probability: 0.2
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -93,6 +93,9 @@ levels:
|
|||||||
add_number_phrase_probability: 0.05
|
add_number_phrase_probability: 0.05
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.75
|
numeric_probability: 0.75
|
||||||
ordinal_probability: 0.25
|
ordinal_probability: 0.25
|
||||||
niveau: &niveau
|
niveau: &niveau
|
||||||
@@ -106,6 +109,9 @@ levels:
|
|||||||
add_number_phrase_probability: 0.05
|
add_number_phrase_probability: 0.05
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.75
|
numeric_probability: 0.75
|
||||||
ordinal_probability: 0.25
|
ordinal_probability: 0.25
|
||||||
bel_etage: &bel_etage
|
bel_etage: &bel_etage
|
||||||
@@ -889,9 +895,7 @@ countries:
|
|||||||
null_probability: 0.6
|
null_probability: 0.6
|
||||||
alphanumeric_probability: 0.4
|
alphanumeric_probability: 0.4
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
probability: 0.0
|
|
||||||
unit_house_number:
|
|
||||||
components:
|
components:
|
||||||
- unit
|
- unit
|
||||||
- house_number
|
- house_number
|
||||||
|
|||||||
@@ -13,17 +13,19 @@ components:
|
|||||||
alphanumeric_probability: 0.25
|
alphanumeric_probability: 0.25
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
level_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- level
|
- level
|
||||||
- unit
|
- unit
|
||||||
label: unit
|
label: unit
|
||||||
separators:
|
separators:
|
||||||
- separator: "/"
|
- separator: "/"
|
||||||
probability: 0.95
|
probability: 0.55
|
||||||
|
- separator: " "
|
||||||
|
probability: 0.4
|
||||||
- separator: "-"
|
- separator: "-"
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
probability: 0.5
|
probability: 0.8
|
||||||
|
|
||||||
|
|
||||||
numbers:
|
numbers:
|
||||||
@@ -100,6 +102,9 @@ levels:
|
|||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.2
|
||||||
|
roman_numeral_probability: 0.8
|
||||||
numeric_probability: 0.1
|
numeric_probability: 0.1
|
||||||
ordinal_probability: 0.9
|
ordinal_probability: 0.9
|
||||||
foldszint: &foldszint
|
foldszint: &foldszint
|
||||||
@@ -220,8 +225,8 @@ levels:
|
|||||||
|
|
||||||
alphanumeric:
|
alphanumeric:
|
||||||
default: *emelet
|
default: *emelet
|
||||||
roman_numeral_probability: 0.8 # With this probability, pick a Roman numeral
|
numeric_probability: 0.59 # With this probability, pick an integer
|
||||||
numeric_probability: 0.19 # With this probability, pick an integer
|
roman_numeral_probability: 0.4 # Pick a Roman numeral for the actual value
|
||||||
alpha_probability: 0.0098 # With this probability, pick a letter e.g. A
|
alpha_probability: 0.0098 # With this probability, pick a letter e.g. A
|
||||||
numeric_plus_alpha_probability: 0.0001 # e.g. 2A
|
numeric_plus_alpha_probability: 0.0001 # e.g. 2A
|
||||||
alpha_plus_numeric_probability: 0.0001 # e.g. A2
|
alpha_plus_numeric_probability: 0.0001 # e.g. A2
|
||||||
|
|||||||
@@ -22,7 +22,7 @@ components:
|
|||||||
alphanumeric_probability: 0.2
|
alphanumeric_probability: 0.2
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -87,10 +87,15 @@ levels:
|
|||||||
direction_probability: 0.95
|
direction_probability: 0.95
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.05
|
add_number_phrase_probability: 0.05
|
||||||
roman_numeral_probability: 0.1
|
digits:
|
||||||
|
ascii_probability: 0.9
|
||||||
|
roman_numeral_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.5
|
||||||
|
spellout_probability: 0.2
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.55
|
numeric_probability: 0.55
|
||||||
ordinal_probability: 0.45
|
ordinal_probability: 0.45
|
||||||
livello: &livello
|
livello: &livello
|
||||||
@@ -104,7 +109,9 @@ levels:
|
|||||||
add_number_phrase_probability: 0.05
|
add_number_phrase_probability: 0.05
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.75
|
numeric_probability: 0.75
|
||||||
ordinal_probability: 0.25
|
ordinal_probability: 0.25
|
||||||
piano_nobile: &piano_nobile
|
piano_nobile: &piano_nobile
|
||||||
|
|||||||
@@ -24,7 +24,7 @@ components:
|
|||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
# Unit is just appended onto the house number
|
# Unit is just appended onto the house number
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
|
|||||||
@@ -23,7 +23,7 @@ components:
|
|||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
# Unit is just appended onto the house number
|
# Unit is just appended onto the house number
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
|
|||||||
@@ -22,7 +22,7 @@ components:
|
|||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
# Bolignummer
|
# Bolignummer
|
||||||
level_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- level
|
- level
|
||||||
- unit
|
- unit
|
||||||
@@ -110,6 +110,9 @@ levels:
|
|||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
hovedetasje: &hovedetasje
|
hovedetasje: &hovedetasje
|
||||||
|
|||||||
@@ -22,7 +22,7 @@ components:
|
|||||||
alphanumeric_probability: 0.2
|
alphanumeric_probability: 0.2
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -72,10 +72,17 @@ levels:
|
|||||||
verdieping: &verdieping
|
verdieping: &verdieping
|
||||||
canonical: verdieping
|
canonical: verdieping
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.8
|
canonical_probability: 0.9
|
||||||
sample_probability: 0.2
|
sample_probability: 0.1
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
|
ordinal:
|
||||||
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
|
numeric_probability: 0.7
|
||||||
|
ordinal_probability: 0.3
|
||||||
etage: &etage
|
etage: &etage
|
||||||
canonical: etage
|
canonical: etage
|
||||||
abbreviated: et
|
abbreviated: et
|
||||||
@@ -85,12 +92,19 @@ levels:
|
|||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
|
ordinal:
|
||||||
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
|
numeric_probability: 0.7
|
||||||
|
ordinal_probability: 0.3
|
||||||
begane_grond: &begane_grond
|
begane_grond: &begane_grond
|
||||||
canonical: begane grond
|
canonical: begane grond
|
||||||
abbreviated: bg
|
abbreviated: bg
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.5
|
canonical_probability: 0.5
|
||||||
sample_probability: 0.2
|
abbreviated_probability: 0.2
|
||||||
sample_probability: 0.3
|
sample_probability: 0.3
|
||||||
benedenverdieping: &benedenverdieping
|
benedenverdieping: &benedenverdieping
|
||||||
canonical: benedenverdieping
|
canonical: benedenverdieping
|
||||||
@@ -114,11 +128,11 @@ levels:
|
|||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
aliases:
|
aliases:
|
||||||
"0":
|
"0":
|
||||||
default: *benedenverdieping
|
default: *begane_grond
|
||||||
probability: 0.5
|
probability: 0.6
|
||||||
alternatives:
|
alternatives:
|
||||||
- alternative: *begane_grond
|
- alternative: *benedenverdieping
|
||||||
probability: 0.45
|
probability: 0.35
|
||||||
- alternative: *parterre
|
- alternative: *parterre
|
||||||
probability: 0.04
|
probability: 0.04
|
||||||
- alternative: *het_gelijkvloers
|
- alternative: *het_gelijkvloers
|
||||||
@@ -497,6 +511,13 @@ countries:
|
|||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
|
ordinal:
|
||||||
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
|
numeric_probability: 0.7
|
||||||
|
ordinal_probability: 0.3
|
||||||
|
|
||||||
aliases:
|
aliases:
|
||||||
"0":
|
"0":
|
||||||
|
|||||||
@@ -21,7 +21,7 @@ components:
|
|||||||
alphanumeric_probability: 0.25
|
alphanumeric_probability: 0.25
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
house_number_unit:
|
-
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- unit
|
- unit
|
||||||
@@ -128,10 +128,14 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.7
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
|
roman_numeral_probability: 0.7
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
parter: &parter
|
parter: &parter
|
||||||
@@ -152,7 +156,9 @@ levels:
|
|||||||
# e.g. 1. suterena
|
# e.g. 1. suterena
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
standalone_probability: 0.985
|
standalone_probability: 0.985
|
||||||
number_abs_value: true
|
number_abs_value: true
|
||||||
number_min_abs_value: 1
|
number_min_abs_value: 1
|
||||||
|
|||||||
@@ -25,35 +25,7 @@ components:
|
|||||||
|
|
||||||
|
|
||||||
combinations:
|
combinations:
|
||||||
# For unit types like 2/34 (more common in Canada and Australia)
|
-
|
||||||
house_number_unit:
|
|
||||||
components:
|
|
||||||
- house_number
|
|
||||||
- unit
|
|
||||||
label: house_number
|
|
||||||
separators:
|
|
||||||
- separator: "-"
|
|
||||||
probability: 0.9
|
|
||||||
- separator: " - "
|
|
||||||
probability: 0.05
|
|
||||||
- separator: /
|
|
||||||
probability: 0.05
|
|
||||||
probability: 0.005
|
|
||||||
house_number_floor:
|
|
||||||
components:
|
|
||||||
- house_number
|
|
||||||
- unit
|
|
||||||
label: house_number
|
|
||||||
separators:
|
|
||||||
- separator: "-"
|
|
||||||
probability: 0.9
|
|
||||||
- separator: " - "
|
|
||||||
probability: 0.05
|
|
||||||
- separator: /
|
|
||||||
probability: 0.05
|
|
||||||
probability: 0.005
|
|
||||||
|
|
||||||
house_number_staircase_unit:
|
|
||||||
components:
|
components:
|
||||||
- house_number
|
- house_number
|
||||||
- staircase
|
- staircase
|
||||||
@@ -67,6 +39,33 @@ components:
|
|||||||
- separator: /
|
- separator: /
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
probability: 0.005
|
probability: 0.005
|
||||||
|
# For unit types like 2/34 (more common in Canada and Australia)
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- unit
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.9
|
||||||
|
- separator: " - "
|
||||||
|
probability: 0.05
|
||||||
|
- separator: /
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.005
|
||||||
|
-
|
||||||
|
components:
|
||||||
|
- house_number
|
||||||
|
- level
|
||||||
|
label: house_number
|
||||||
|
separators:
|
||||||
|
- separator: "-"
|
||||||
|
probability: 0.9
|
||||||
|
- separator: " - "
|
||||||
|
probability: 0.05
|
||||||
|
- separator: /
|
||||||
|
probability: 0.05
|
||||||
|
probability: 0.005
|
||||||
|
|
||||||
|
|
||||||
numbers:
|
numbers:
|
||||||
@@ -134,6 +133,9 @@ levels:
|
|||||||
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
||||||
# If ordinal is selected, chance of e.g. just using 2o without Andar
|
# If ordinal is selected, chance of e.g. just using 2o without Andar
|
||||||
null_phrase_probability: 0.6
|
null_phrase_probability: 0.6
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.2
|
numeric_probability: 0.2
|
||||||
ordinal_probability: 0.8
|
ordinal_probability: 0.8
|
||||||
nivel: &nivel
|
nivel: &nivel
|
||||||
@@ -151,6 +153,9 @@ levels:
|
|||||||
direction_probability: 0.95
|
direction_probability: 0.95
|
||||||
standalone_probability: 0.2
|
standalone_probability: 0.2
|
||||||
null_phrase_probability: 0.6
|
null_phrase_probability: 0.6
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.2
|
numeric_probability: 0.2
|
||||||
ordinal_probability: 0.8
|
ordinal_probability: 0.8
|
||||||
|
|
||||||
@@ -176,6 +181,9 @@ levels:
|
|||||||
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
standalone_probability: 0.2 # Let e.g. 5º be the entire floor string
|
||||||
# If ordinal is selected, chance of e.g. just using 2o without Piso
|
# If ordinal is selected, chance of e.g. just using 2o without Piso
|
||||||
null_phrase_probability: 0.6
|
null_phrase_probability: 0.6
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.2
|
numeric_probability: 0.2
|
||||||
numeric_affix_probability: 0.05
|
numeric_affix_probability: 0.05
|
||||||
ordinal_probability: 0.75
|
ordinal_probability: 0.75
|
||||||
@@ -204,8 +212,7 @@ levels:
|
|||||||
terreo: &terreo
|
terreo: &terreo
|
||||||
canonical: terréo
|
canonical: terréo
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.3
|
canonical_probability: 0.7
|
||||||
abbreviated_probability: 0.4
|
|
||||||
sample_probability: 0.3
|
sample_probability: 0.3
|
||||||
baixos: &baixos
|
baixos: &baixos
|
||||||
canonical: baixos
|
canonical: baixos
|
||||||
@@ -241,6 +248,9 @@ levels:
|
|||||||
canonical: sub cave
|
canonical: sub cave
|
||||||
abbreviated: scv
|
abbreviated: scv
|
||||||
sample: true
|
sample: true
|
||||||
|
canonical_probability: 0.4
|
||||||
|
abbreviated_probability: 0.3
|
||||||
|
sample_probability: 0.3
|
||||||
# e.g. sub cave 1
|
# e.g. sub cave 1
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
@@ -750,6 +760,10 @@ units:
|
|||||||
canonical: casa
|
canonical: casa
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
|
moradia: &moradia
|
||||||
|
canonical: moradia
|
||||||
|
numeric:
|
||||||
|
direction: left
|
||||||
room: &sala
|
room: &sala
|
||||||
canonical: sala
|
canonical: sala
|
||||||
numeric:
|
numeric:
|
||||||
@@ -769,10 +783,12 @@ units:
|
|||||||
alternatives:
|
alternatives:
|
||||||
- alternative: *sala
|
- alternative: *sala
|
||||||
probability: 0.1
|
probability: 0.1
|
||||||
- alternative: *casa
|
|
||||||
probability: 0.05
|
|
||||||
- alternative: *porta
|
- alternative: *porta
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
|
- alternative: *casa
|
||||||
|
probability: 0.04
|
||||||
|
- alternative: *moradia
|
||||||
|
probability: 0.01
|
||||||
|
|
||||||
# Separate random probability for adding directions like 2o Izq, 2 Dcha, etc.
|
# Separate random probability for adding directions like 2o Izq, 2 Dcha, etc.
|
||||||
add_direction: true
|
add_direction: true
|
||||||
@@ -796,7 +812,9 @@ units:
|
|||||||
- alternative: *sala
|
- alternative: *sala
|
||||||
probability: 0.1
|
probability: 0.1
|
||||||
- alternative: *casa
|
- alternative: *casa
|
||||||
probability: 0.03
|
probability: 0.02
|
||||||
|
- alternative: *moradia
|
||||||
|
probability: 0.01
|
||||||
- alternative: *porta
|
- alternative: *porta
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *letra
|
- alternative: *letra
|
||||||
@@ -903,7 +921,7 @@ countries:
|
|||||||
levels:
|
levels:
|
||||||
numbering_starts_at: 1
|
numbering_starts_at: 1
|
||||||
aliases:
|
aliases:
|
||||||
"0":
|
"0": &ground_floor_brasil
|
||||||
default: *andar_terreo
|
default: *andar_terreo
|
||||||
probability: 0.4
|
probability: 0.4
|
||||||
alternatives:
|
alternatives:
|
||||||
@@ -920,7 +938,7 @@ countries:
|
|||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *piso
|
- alternative: *piso
|
||||||
probability: 0.01
|
probability: 0.01
|
||||||
|
"1": *ground_floor_brasil
|
||||||
|
|
||||||
postcodes:
|
postcodes:
|
||||||
alphanumeric:
|
alphanumeric:
|
||||||
@@ -929,8 +947,8 @@ countries:
|
|||||||
abbreviated: cep
|
abbreviated: cep
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.001
|
canonical_probability: 0.001
|
||||||
abbreviated_probability: 0.995
|
abbreviated_probability: 0.949
|
||||||
sample_probability: 0.004
|
sample_probability: 0.05
|
||||||
|
|
||||||
numeric:
|
numeric:
|
||||||
# Postcodes in Brazil are sometimes prefixed by CEP
|
# Postcodes in Brazil are sometimes prefixed by CEP
|
||||||
@@ -945,7 +963,7 @@ countries:
|
|||||||
numeric_affix_probability: 0.12
|
numeric_affix_probability: 0.12
|
||||||
strict_numeric: true
|
strict_numeric: true
|
||||||
|
|
||||||
po_boxes:
|
po_boxes: &po_boxes_caixa_postal
|
||||||
alphanumeric:
|
alphanumeric:
|
||||||
default:
|
default:
|
||||||
canonical: caixa postal
|
canonical: caixa postal
|
||||||
@@ -982,3 +1000,55 @@ countries:
|
|||||||
probability: 0.05
|
probability: 0.05
|
||||||
- alternative: *letra
|
- alternative: *letra
|
||||||
probability: 0.05
|
probability: 0.05
|
||||||
|
|
||||||
|
# Angola
|
||||||
|
ao:
|
||||||
|
postcodes: &postcodes_codigo_postal
|
||||||
|
alphanumeric:
|
||||||
|
default:
|
||||||
|
canonical: código postal
|
||||||
|
abbreviated: cp
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.001
|
||||||
|
abbreviated_probability: 0.949
|
||||||
|
sample_probability: 0.05
|
||||||
|
|
||||||
|
numeric:
|
||||||
|
direction: left
|
||||||
|
|
||||||
|
numeric_affix:
|
||||||
|
affix: cp
|
||||||
|
direction: left
|
||||||
|
# null_probability means the chance of doing nothing e.g. just the postal code
|
||||||
|
null_probability: 0.7
|
||||||
|
numeric_probability: 0.18
|
||||||
|
numeric_affix_probability: 0.12
|
||||||
|
strict_numeric: true
|
||||||
|
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
# Mozambique
|
||||||
|
mz:
|
||||||
|
postcodes: *postcodes_codigo_postal
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
# Cape Verde
|
||||||
|
cv:
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
|
||||||
|
# East Timor
|
||||||
|
tl:
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
# São Tome and Principe
|
||||||
|
st:
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
# Guinea-Bissau
|
||||||
|
gw:
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|
||||||
|
# Macau
|
||||||
|
mo:
|
||||||
|
po_boxes: *po_boxes_caixa_postal
|
||||||
|
|||||||
@@ -114,7 +114,9 @@ levels:
|
|||||||
direction: left
|
direction: left
|
||||||
add_number_phrase: true # Occasionally add variation of "number", e.g. et. nr 2
|
add_number_phrase: true # Occasionally add variation of "number", e.g. et. nr 2
|
||||||
add_number_phrase_probability: 0.05
|
add_number_phrase_probability: 0.05
|
||||||
roman_numeral_probability: 0.2
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
roman_numeral_probability: 0.2
|
||||||
# Ground floor
|
# Ground floor
|
||||||
parter: &parter
|
parter: &parter
|
||||||
canonical: parter
|
canonical: parter
|
||||||
|
|||||||
@@ -53,8 +53,8 @@ house_number:
|
|||||||
canonical: дом
|
canonical: дом
|
||||||
abbreviated: д
|
abbreviated: д
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.8
|
canonical_probability: 0.6
|
||||||
abbreviated_probability: 0.1
|
abbreviated_probability: 0.3
|
||||||
sample_probability: 0.1
|
sample_probability: 0.1
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
@@ -62,8 +62,8 @@ house_number:
|
|||||||
canonical: dom
|
canonical: dom
|
||||||
abbreviated: d
|
abbreviated: d
|
||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.8
|
canonical_probability: 0.6
|
||||||
abbreviated_probability: 0.1
|
abbreviated_probability: 0.3
|
||||||
sample_probability: 0.1
|
sample_probability: 0.1
|
||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
@@ -95,8 +95,8 @@ and:
|
|||||||
|
|
||||||
|
|
||||||
cross_streets:
|
cross_streets:
|
||||||
and: *i
|
i: *i
|
||||||
and: *i_latin
|
i_latin: *i_latin
|
||||||
corner: &ugol
|
corner: &ugol
|
||||||
canonical: угол
|
canonical: угол
|
||||||
sample: true
|
sample: true
|
||||||
@@ -177,6 +177,9 @@ levels:
|
|||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
|
digits:
|
||||||
|
ascii_probability: 0.8
|
||||||
|
spellout_probability: 0.2
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
etazh_latin: &etazh_latin
|
etazh_latin: &etazh_latin
|
||||||
@@ -217,6 +220,26 @@ levels:
|
|||||||
direction: right
|
direction: right
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
|
pervyy_etazh: &pervyy_etazh
|
||||||
|
canonical: первый этаж
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.9
|
||||||
|
sample_probability: 0.1
|
||||||
|
pervyy_etazh_latin: &pervyy_etazh_latin
|
||||||
|
canonical: pervyy etazh
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.9
|
||||||
|
sample_probability: 0.1
|
||||||
|
nizhniy_etazh: &nizhniy_etazh
|
||||||
|
canonical: нижний этаж
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.9
|
||||||
|
sample_probability: 0.1
|
||||||
|
nizhniy_etazh_latin: &nizhniy_etazh_latin
|
||||||
|
canonical: nizhniy etazh
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.9
|
||||||
|
sample_probability: 0.1
|
||||||
tsokolnyy_etazh: &tsokolnyy_etazh
|
tsokolnyy_etazh: &tsokolnyy_etazh
|
||||||
canonical: цокольный этаж
|
canonical: цокольный этаж
|
||||||
abbreviated: цок эт
|
abbreviated: цок эт
|
||||||
@@ -295,7 +318,20 @@ levels:
|
|||||||
probability: 0.09
|
probability: 0.09
|
||||||
- alternative: *etazh_latin
|
- alternative: *etazh_latin
|
||||||
probability: 0.01
|
probability: 0.01
|
||||||
"0": *ground_floor
|
"0":
|
||||||
|
default: *pervyy_etazh
|
||||||
|
probability: 0.6
|
||||||
|
alternatives:
|
||||||
|
- alternative: *pervyy_etazh_latin
|
||||||
|
probability: 0.05
|
||||||
|
- alternative: *nizhniy_etazh
|
||||||
|
probability: 0.2
|
||||||
|
- alternative: *nizhniy_etazh_latin
|
||||||
|
probability: 0.05
|
||||||
|
- alternative: *tsokolnyy_etazh
|
||||||
|
probability: 0.075
|
||||||
|
- alternative: *tsokolnyy_etazh_latin
|
||||||
|
probability: 0.025
|
||||||
|
|
||||||
numbering_starts_at: 0
|
numbering_starts_at: 0
|
||||||
|
|
||||||
@@ -321,7 +357,7 @@ categories:
|
|||||||
sample: true
|
sample: true
|
||||||
canonical_probability: 0.8
|
canonical_probability: 0.8
|
||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
probability: 0.74
|
probability: 0.69
|
||||||
alternatives:
|
alternatives:
|
||||||
- alternative:
|
- alternative:
|
||||||
canonical: vblizi
|
canonical: vblizi
|
||||||
@@ -347,6 +383,18 @@ categories:
|
|||||||
canonical_probability: 0.8
|
canonical_probability: 0.8
|
||||||
sample_probability: 0.2
|
sample_probability: 0.2
|
||||||
probability: 0.04
|
probability: 0.04
|
||||||
|
- alternative:
|
||||||
|
canonical: под
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.8
|
||||||
|
sample_probability: 0.2
|
||||||
|
probability: 0.04
|
||||||
|
- alternative:
|
||||||
|
canonical: pod
|
||||||
|
sample: true
|
||||||
|
canonical_probability: 0.8
|
||||||
|
sample_probability: 0.2
|
||||||
|
probability: 0.01
|
||||||
- alternative:
|
- alternative:
|
||||||
canonical: okolo
|
canonical: okolo
|
||||||
sample: true
|
sample: true
|
||||||
|
|||||||
@@ -101,12 +101,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.7
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
|
roman_numeral_probability: 0.7
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
@@ -119,12 +123,16 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.7
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
|
roman_numeral_probability: 0.7
|
||||||
add_number_phrase: true
|
add_number_phrase: true
|
||||||
add_number_phrase_probability: 0.1
|
add_number_phrase_probability: 0.1
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
@@ -140,10 +148,14 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
etaz: &etaz
|
etaz: &etaz
|
||||||
@@ -154,10 +166,14 @@ levels:
|
|||||||
numeric:
|
numeric:
|
||||||
direction: left
|
direction: left
|
||||||
direction_probability: 0.9
|
direction_probability: 0.9
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
numeric_probability: 0.4
|
numeric_probability: 0.4
|
||||||
ordinal_probability: 0.6
|
ordinal_probability: 0.6
|
||||||
prizemie: &prizemie
|
prizemie: &prizemie
|
||||||
@@ -183,7 +199,9 @@ levels:
|
|||||||
# e.g. 1. podzemné podlažie
|
# e.g. 1. podzemné podlažie
|
||||||
ordinal:
|
ordinal:
|
||||||
direction: right
|
direction: right
|
||||||
roman_numeral_probability: 0.3
|
digits:
|
||||||
|
ascii_probability: 0.7
|
||||||
|
roman_numeral_probability: 0.3
|
||||||
standalone_probability: 0.985
|
standalone_probability: 0.985
|
||||||
number_abs_value: true
|
number_abs_value: true
|
||||||
number_min_abs_value: 1
|
number_min_abs_value: 1
|
||||||
|
|||||||
@@ -117,6 +117,7 @@ po_boxes:
|
|||||||
affix: 邮政信箱
|
affix: 邮政信箱
|
||||||
direction: left
|
direction: left
|
||||||
digits:
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
unicode_full_width_probability: 0.5
|
unicode_full_width_probability: 0.5
|
||||||
spellout_probability: 0.2
|
spellout_probability: 0.2
|
||||||
use_number_phrase: true
|
use_number_phrase: true
|
||||||
@@ -129,6 +130,7 @@ po_boxes:
|
|||||||
affix: 郵政信箱
|
affix: 郵政信箱
|
||||||
direction: left
|
direction: left
|
||||||
digits:
|
digits:
|
||||||
|
ascii_probability: 0.3
|
||||||
unicode_full_width_probability: 0.5
|
unicode_full_width_probability: 0.5
|
||||||
spellout_probability: 0.2
|
spellout_probability: 0.2
|
||||||
use_number_phrase: true
|
use_number_phrase: true
|
||||||
|
|||||||
Reference in New Issue
Block a user