From 18d6b8c63a35a599a819af4e5f2a82bf02f040c4 Mon Sep 17 00:00:00 2001 From: Al Date: Thu, 7 Jul 2016 03:38:06 -0400 Subject: [PATCH] [addresses] field combinations, Roman numerals and spellout for Russian config --- resources/addresses/ru.yaml | 89 ++++++++++++++++++++++++++++++++++--- 1 file changed, 83 insertions(+), 6 deletions(-) diff --git a/resources/addresses/ru.yaml b/resources/addresses/ru.yaml index 3a1cdf38..369f9970 100644 --- a/resources/addresses/ru.yaml +++ b/resources/addresses/ru.yaml @@ -24,6 +24,57 @@ components: alphanumeric_probability: 0.4 + combinations: + - + components: + - house_number + - staircase + - level + - unit + label: house_number + separators: + - separator: "/" + probability: 0.95 + - separator: "-" + probability: 0.05 + probability: 0.005 + - + components: + - house_number + - level + - unit + label: house_number + separators: + - separator: "/" + probability: 0.95 + - separator: "-" + probability: 0.05 + probability: 0.005 + - + components: + - house_number + - level + label: house_number + separators: + - separator: "/" + probability: 0.95 + - separator: "-" + probability: 0.05 + probability: 0.01 + # For unit types like 2/34 + - + components: + - house_number + - unit + label: house_number + separators: + - separator: "/" + probability: 0.95 + - separator: "-" + probability: 0.05 + probability: 0.005 + + numbers: default: &nomer canonical: номер @@ -175,10 +226,15 @@ levels: numeric: direction: left direction_probability: 0.9 + digits: + ascii_probability: 0.8 + roman_numeral_probability: 0.1 + spellout_probability: 0.1 ordinal: direction: right digits: - ascii_probability: 0.8 + ascii_probability: 0.5 + roman_numeral_probability: 0.3 spellout_probability: 0.2 numeric_probability: 0.4 ordinal_probability: 0.6 @@ -192,8 +248,16 @@ levels: numeric: direction: left direction_probability: 0.9 + digits: + ascii_probability: 0.8 + roman_numeral_probability: 0.1 + spellout_probability: 0.1 ordinal: direction: right + digits: + ascii_probability: 0.5 + roman_numeral_probability: 0.3 + spellout_probability: 0.2 numeric_probability: 0.4 ordinal_probability: 0.6 uroven: &uroven @@ -204,8 +268,16 @@ levels: numeric: direction: left direction_probability: 0.9 + digits: + ascii_probability: 0.8 + roman_numeral_probability: 0.1 + spellout_probability: 0.1 ordinal: direction: right + digits: + ascii_probability: 0.5 + roman_numeral_probability: 0.3 + spellout_probability: 0.2 numeric_probability: 0.4 ordinal_probability: 0.6 uroven_latin: &uroven_latin @@ -216,8 +288,16 @@ levels: numeric: direction: left direction_probability: 0.9 + digits: + ascii_probability: 0.8 + roman_numeral_probability: 0.1 + spellout_probability: 0.1 ordinal: direction: right + digits: + ascii_probability: 0.5 + roman_numeral_probability: 0.3 + spellout_probability: 0.2 numeric_probability: 0.4 ordinal_probability: 0.6 pervyy_etazh: &pervyy_etazh @@ -267,8 +347,6 @@ levels: direction: left ordinal: direction: right - ordinal: - direction: right number_abs_value: true number_min_abs_value: 2 # Basement 2 == Sub-basement 1 @@ -290,8 +368,6 @@ levels: direction: left ordinal: direction: right - ordinal: - direction: right number_abs_value: true number_min_abs_value: 2 # Basement 2 == Sub-basement 1 @@ -345,7 +421,8 @@ levels: probability: 0.09 - alternative: *uroven_latin probability: 0.01 - numeric_probability: 0.99 # With this probability, pick an integer + numeric_probability: 0.79 # With this probability, pick an integer + roman_numeral_probability: 0.2 alpha_probability: 0.0098 # With this probability, pick a letter e.g. A numeric_plus_alpha_probability: 0.0001 # e.g. 2A alpha_plus_numeric_probability: 0.0001 # e.g. A2