From fda639f29958282e8e6336247daa939e7c17c93b Mon Sep 17 00:00:00 2001 From: Al Date: Wed, 18 Jan 2017 20:04:33 -0500 Subject: [PATCH] =?UTF-8?q?[dictionaries/addresses]=20adding=20=D0=B1?= =?UTF-8?q?=D0=B5=D0=B7=20=D0=BD=D0=BE=D0=BC=D0=B5=D1=80=D0=B0=20(=D0=B1/?= =?UTF-8?q?=D0=BD)=20for=20addresses=20with=20no=20number=20in=20Russian?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- resources/addresses/ru.yaml | 11 +++++++++++ resources/dictionaries/ru/no_number.txt | 1 + 2 files changed, 12 insertions(+) create mode 100644 resources/dictionaries/ru/no_number.txt diff --git a/resources/addresses/ru.yaml b/resources/addresses/ru.yaml index 0244b663..5651a5b4 100644 --- a/resources/addresses/ru.yaml +++ b/resources/addresses/ru.yaml @@ -125,8 +125,19 @@ house_numbers: - alternative: *dom_latin probability: 0.05 + # без номера (б/н) addresses + no_number: + default: + canonical: без номера + abbreviated: б/н + sample: true + canonical_probability: 0.1 + abbreviated_probability: 0.7 + sample_probability: 0.2 + # Very common in Russian to write dom/d alphanumeric_phrase_probability: 0.6 + no_number_probability: 0.1 # With this probability, use без номера if no house_number is specified and: default: &i diff --git a/resources/dictionaries/ru/no_number.txt b/resources/dictionaries/ru/no_number.txt new file mode 100644 index 00000000..0983819c --- /dev/null +++ b/resources/dictionaries/ru/no_number.txt @@ -0,0 +1 @@ +без номера|б / н|б.н.|б.н|бн \ No newline at end of file