From 271800bbf993f91788a456f2cd1fe1774d84ef60 Mon Sep 17 00:00:00 2001 From: Al Date: Wed, 2 Mar 2016 15:52:38 -0500 Subject: [PATCH] [dictionaries] Adding all single letter tokens to ambiguous dictionaries so libpostal will always include an unexpanded version (e.g. for initials) --- resources/dictionaries/af/ambiguous_expansions.txt | 8 ++++++++ resources/dictionaries/be/ambiguous_expansions.txt | 8 ++++++++ resources/dictionaries/bg/ambiguous_expansions.txt | 2 ++ resources/dictionaries/bs/ambiguous_expansions.txt | 1 + resources/dictionaries/ca/ambiguous_expansions.txt | 8 ++++++++ resources/dictionaries/da/ambiguous_expansions.txt | 5 +++++ resources/dictionaries/de/ambiguous_expansions.txt | 14 ++++++++++++++ resources/dictionaries/en/ambiguous_expansions.txt | 3 +++ resources/dictionaries/es/ambiguous_expansions.txt | 9 +++++++++ resources/dictionaries/et/ambiguous_expansions.txt | 4 ++++ resources/dictionaries/eu/ambiguous_expansions.txt | 1 + resources/dictionaries/fi/ambiguous_expansions.txt | 4 ++++ resources/dictionaries/fr/ambiguous_expansions.txt | 13 ++++++++++++- resources/dictionaries/gl/ambiguous_expansions.txt | 5 +++++ .../dictionaries/gsw/ambiguous_expansions.txt | 1 + resources/dictionaries/hr/ambiguous_expansions.txt | 1 + resources/dictionaries/hu/ambiguous_expansions.txt | 1 + resources/dictionaries/it/ambiguous_expansions.txt | 7 +++++++ resources/dictionaries/ja/ambiguous_expansions.txt | 5 +++++ resources/dictionaries/ka/ambiguous_expansions.txt | 1 + resources/dictionaries/lt/ambiguous_expansions.txt | 5 +++++ resources/dictionaries/nb/ambiguous_expansions.txt | 6 ++++++ resources/dictionaries/nl/ambiguous_expansions.txt | 8 ++++++++ resources/dictionaries/pl/ambiguous_expansions.txt | 7 +++++++ resources/dictionaries/pt/ambiguous_expansions.txt | 10 ++++++++++ resources/dictionaries/ru/ambiguous_expansions.txt | 9 +++++++++ resources/dictionaries/sl/ambiguous_expansions.txt | 2 ++ resources/dictionaries/sv/ambiguous_expansions.txt | 7 +++++++ resources/dictionaries/tr/ambiguous_expansions.txt | 2 ++ resources/dictionaries/uk/ambiguous_expansions.txt | 1 + resources/dictionaries/vi/ambiguous_expansions.txt | 3 +++ 31 files changed, 160 insertions(+), 1 deletion(-) create mode 100644 resources/dictionaries/af/ambiguous_expansions.txt create mode 100644 resources/dictionaries/be/ambiguous_expansions.txt create mode 100644 resources/dictionaries/bg/ambiguous_expansions.txt create mode 100644 resources/dictionaries/bs/ambiguous_expansions.txt create mode 100644 resources/dictionaries/ca/ambiguous_expansions.txt create mode 100644 resources/dictionaries/da/ambiguous_expansions.txt create mode 100644 resources/dictionaries/de/ambiguous_expansions.txt create mode 100644 resources/dictionaries/es/ambiguous_expansions.txt create mode 100644 resources/dictionaries/et/ambiguous_expansions.txt create mode 100644 resources/dictionaries/eu/ambiguous_expansions.txt create mode 100644 resources/dictionaries/fi/ambiguous_expansions.txt create mode 100644 resources/dictionaries/gl/ambiguous_expansions.txt create mode 100644 resources/dictionaries/gsw/ambiguous_expansions.txt create mode 100644 resources/dictionaries/hr/ambiguous_expansions.txt create mode 100644 resources/dictionaries/hu/ambiguous_expansions.txt create mode 100644 resources/dictionaries/it/ambiguous_expansions.txt create mode 100644 resources/dictionaries/ja/ambiguous_expansions.txt create mode 100644 resources/dictionaries/ka/ambiguous_expansions.txt create mode 100644 resources/dictionaries/lt/ambiguous_expansions.txt create mode 100644 resources/dictionaries/nb/ambiguous_expansions.txt create mode 100644 resources/dictionaries/nl/ambiguous_expansions.txt create mode 100644 resources/dictionaries/pl/ambiguous_expansions.txt create mode 100644 resources/dictionaries/pt/ambiguous_expansions.txt create mode 100644 resources/dictionaries/ru/ambiguous_expansions.txt create mode 100644 resources/dictionaries/sl/ambiguous_expansions.txt create mode 100644 resources/dictionaries/sv/ambiguous_expansions.txt create mode 100644 resources/dictionaries/tr/ambiguous_expansions.txt create mode 100644 resources/dictionaries/uk/ambiguous_expansions.txt create mode 100644 resources/dictionaries/vi/ambiguous_expansions.txt diff --git a/resources/dictionaries/af/ambiguous_expansions.txt b/resources/dictionaries/af/ambiguous_expansions.txt new file mode 100644 index 00000000..809bf5af --- /dev/null +++ b/resources/dictionaries/af/ambiguous_expansions.txt @@ -0,0 +1,8 @@ +h +k +l +n +o +s +v +w \ No newline at end of file diff --git a/resources/dictionaries/be/ambiguous_expansions.txt b/resources/dictionaries/be/ambiguous_expansions.txt new file mode 100644 index 00000000..e5131e30 --- /dev/null +++ b/resources/dictionaries/be/ambiguous_expansions.txt @@ -0,0 +1,8 @@ +d +h +k +s +г +д +к +ш \ No newline at end of file diff --git a/resources/dictionaries/bg/ambiguous_expansions.txt b/resources/dictionaries/bg/ambiguous_expansions.txt new file mode 100644 index 00000000..b08b8435 --- /dev/null +++ b/resources/dictionaries/bg/ambiguous_expansions.txt @@ -0,0 +1,2 @@ +s +с \ No newline at end of file diff --git a/resources/dictionaries/bs/ambiguous_expansions.txt b/resources/dictionaries/bs/ambiguous_expansions.txt new file mode 100644 index 00000000..3410062b --- /dev/null +++ b/resources/dictionaries/bs/ambiguous_expansions.txt @@ -0,0 +1 @@ +c \ No newline at end of file diff --git a/resources/dictionaries/ca/ambiguous_expansions.txt b/resources/dictionaries/ca/ambiguous_expansions.txt new file mode 100644 index 00000000..60685bd0 --- /dev/null +++ b/resources/dictionaries/ca/ambiguous_expansions.txt @@ -0,0 +1,8 @@ +b +d +e +h +n +o +s +v \ No newline at end of file diff --git a/resources/dictionaries/da/ambiguous_expansions.txt b/resources/dictionaries/da/ambiguous_expansions.txt new file mode 100644 index 00000000..a0fd62aa --- /dev/null +++ b/resources/dictionaries/da/ambiguous_expansions.txt @@ -0,0 +1,5 @@ +n +o +s +v +ø \ No newline at end of file diff --git a/resources/dictionaries/de/ambiguous_expansions.txt b/resources/dictionaries/de/ambiguous_expansions.txt new file mode 100644 index 00000000..45c3d48b --- /dev/null +++ b/resources/dictionaries/de/ambiguous_expansions.txt @@ -0,0 +1,14 @@ +a +b +d +g +h +i +k +n +o +s +u +v +w +z \ No newline at end of file diff --git a/resources/dictionaries/en/ambiguous_expansions.txt b/resources/dictionaries/en/ambiguous_expansions.txt index 8ce96508..f46bf831 100644 --- a/resources/dictionaries/en/ambiguous_expansions.txt +++ b/resources/dictionaries/en/ambiguous_expansions.txt @@ -14,7 +14,9 @@ ct de dc e +f fl +g ga hi i @@ -22,6 +24,7 @@ id il in ia +j jbt ks ky diff --git a/resources/dictionaries/es/ambiguous_expansions.txt b/resources/dictionaries/es/ambiguous_expansions.txt new file mode 100644 index 00000000..cd9440b6 --- /dev/null +++ b/resources/dictionaries/es/ambiguous_expansions.txt @@ -0,0 +1,9 @@ +c +d +e +g +n +p +s +v +w \ No newline at end of file diff --git a/resources/dictionaries/et/ambiguous_expansions.txt b/resources/dictionaries/et/ambiguous_expansions.txt new file mode 100644 index 00000000..d97bc2d4 --- /dev/null +++ b/resources/dictionaries/et/ambiguous_expansions.txt @@ -0,0 +1,4 @@ +k +l +p +t \ No newline at end of file diff --git a/resources/dictionaries/eu/ambiguous_expansions.txt b/resources/dictionaries/eu/ambiguous_expansions.txt new file mode 100644 index 00000000..23fa7d31 --- /dev/null +++ b/resources/dictionaries/eu/ambiguous_expansions.txt @@ -0,0 +1 @@ +k \ No newline at end of file diff --git a/resources/dictionaries/fi/ambiguous_expansions.txt b/resources/dictionaries/fi/ambiguous_expansions.txt new file mode 100644 index 00000000..48370ef9 --- /dev/null +++ b/resources/dictionaries/fi/ambiguous_expansions.txt @@ -0,0 +1,4 @@ +k +p +r +t \ No newline at end of file diff --git a/resources/dictionaries/fr/ambiguous_expansions.txt b/resources/dictionaries/fr/ambiguous_expansions.txt index c1b6a9a6..ca1ae415 100644 --- a/resources/dictionaries/fr/ambiguous_expansions.txt +++ b/resources/dictionaries/fr/ambiguous_expansions.txt @@ -1,13 +1,24 @@ +a ab bc +c +e +g +m +n mb nb nl ns nt nu +o on +p pe qc +r +s sk -yt \ No newline at end of file +yt +z diff --git a/resources/dictionaries/gl/ambiguous_expansions.txt b/resources/dictionaries/gl/ambiguous_expansions.txt new file mode 100644 index 00000000..4634c792 --- /dev/null +++ b/resources/dictionaries/gl/ambiguous_expansions.txt @@ -0,0 +1,5 @@ +e +n +o +r +s \ No newline at end of file diff --git a/resources/dictionaries/gsw/ambiguous_expansions.txt b/resources/dictionaries/gsw/ambiguous_expansions.txt new file mode 100644 index 00000000..6bf0c97a --- /dev/null +++ b/resources/dictionaries/gsw/ambiguous_expansions.txt @@ -0,0 +1 @@ +w \ No newline at end of file diff --git a/resources/dictionaries/hr/ambiguous_expansions.txt b/resources/dictionaries/hr/ambiguous_expansions.txt new file mode 100644 index 00000000..3410062b --- /dev/null +++ b/resources/dictionaries/hr/ambiguous_expansions.txt @@ -0,0 +1 @@ +c \ No newline at end of file diff --git a/resources/dictionaries/hu/ambiguous_expansions.txt b/resources/dictionaries/hu/ambiguous_expansions.txt new file mode 100644 index 00000000..f3c6c3c6 --- /dev/null +++ b/resources/dictionaries/hu/ambiguous_expansions.txt @@ -0,0 +1 @@ +u \ No newline at end of file diff --git a/resources/dictionaries/it/ambiguous_expansions.txt b/resources/dictionaries/it/ambiguous_expansions.txt new file mode 100644 index 00000000..1bcea6fb --- /dev/null +++ b/resources/dictionaries/it/ambiguous_expansions.txt @@ -0,0 +1,7 @@ +c +e +l +n +o +s +v \ No newline at end of file diff --git a/resources/dictionaries/ja/ambiguous_expansions.txt b/resources/dictionaries/ja/ambiguous_expansions.txt new file mode 100644 index 00000000..aad01a2a --- /dev/null +++ b/resources/dictionaries/ja/ambiguous_expansions.txt @@ -0,0 +1,5 @@ +中 +大 +小 +銀 +高 \ No newline at end of file diff --git a/resources/dictionaries/ka/ambiguous_expansions.txt b/resources/dictionaries/ka/ambiguous_expansions.txt new file mode 100644 index 00000000..926a453d --- /dev/null +++ b/resources/dictionaries/ka/ambiguous_expansions.txt @@ -0,0 +1 @@ +ქ \ No newline at end of file diff --git a/resources/dictionaries/lt/ambiguous_expansions.txt b/resources/dictionaries/lt/ambiguous_expansions.txt new file mode 100644 index 00000000..bd110234 --- /dev/null +++ b/resources/dictionaries/lt/ambiguous_expansions.txt @@ -0,0 +1,5 @@ +a +g +k +m +r \ No newline at end of file diff --git a/resources/dictionaries/nb/ambiguous_expansions.txt b/resources/dictionaries/nb/ambiguous_expansions.txt new file mode 100644 index 00000000..e98536a1 --- /dev/null +++ b/resources/dictionaries/nb/ambiguous_expansions.txt @@ -0,0 +1,6 @@ +g +n +o +s +v +ø \ No newline at end of file diff --git a/resources/dictionaries/nl/ambiguous_expansions.txt b/resources/dictionaries/nl/ambiguous_expansions.txt new file mode 100644 index 00000000..daebdfc9 --- /dev/null +++ b/resources/dictionaries/nl/ambiguous_expansions.txt @@ -0,0 +1,8 @@ +h +k +l +n +o +v +w +z \ No newline at end of file diff --git a/resources/dictionaries/pl/ambiguous_expansions.txt b/resources/dictionaries/pl/ambiguous_expansions.txt new file mode 100644 index 00000000..4acdf586 --- /dev/null +++ b/resources/dictionaries/pl/ambiguous_expansions.txt @@ -0,0 +1,7 @@ +g +k +m +o +p +u +w \ No newline at end of file diff --git a/resources/dictionaries/pt/ambiguous_expansions.txt b/resources/dictionaries/pt/ambiguous_expansions.txt new file mode 100644 index 00000000..9cc53462 --- /dev/null +++ b/resources/dictionaries/pt/ambiguous_expansions.txt @@ -0,0 +1,10 @@ +b +d +e +l +n +o +q +r +s +v \ No newline at end of file diff --git a/resources/dictionaries/ru/ambiguous_expansions.txt b/resources/dictionaries/ru/ambiguous_expansions.txt new file mode 100644 index 00000000..fc8d34fa --- /dev/null +++ b/resources/dictionaries/ru/ambiguous_expansions.txt @@ -0,0 +1,9 @@ +d +g +k +o +г +д +к +о +ш \ No newline at end of file diff --git a/resources/dictionaries/sl/ambiguous_expansions.txt b/resources/dictionaries/sl/ambiguous_expansions.txt new file mode 100644 index 00000000..7be1ea7c --- /dev/null +++ b/resources/dictionaries/sl/ambiguous_expansions.txt @@ -0,0 +1,2 @@ +c +v \ No newline at end of file diff --git a/resources/dictionaries/sv/ambiguous_expansions.txt b/resources/dictionaries/sv/ambiguous_expansions.txt new file mode 100644 index 00000000..dfb0bf5f --- /dev/null +++ b/resources/dictionaries/sv/ambiguous_expansions.txt @@ -0,0 +1,7 @@ +g +l +n +o +s +v +ö \ No newline at end of file diff --git a/resources/dictionaries/tr/ambiguous_expansions.txt b/resources/dictionaries/tr/ambiguous_expansions.txt new file mode 100644 index 00000000..3b23df14 --- /dev/null +++ b/resources/dictionaries/tr/ambiguous_expansions.txt @@ -0,0 +1,2 @@ +d +k \ No newline at end of file diff --git a/resources/dictionaries/uk/ambiguous_expansions.txt b/resources/dictionaries/uk/ambiguous_expansions.txt new file mode 100644 index 00000000..46b2a9ba --- /dev/null +++ b/resources/dictionaries/uk/ambiguous_expansions.txt @@ -0,0 +1 @@ +ш \ No newline at end of file diff --git a/resources/dictionaries/vi/ambiguous_expansions.txt b/resources/dictionaries/vi/ambiguous_expansions.txt new file mode 100644 index 00000000..e90c0293 --- /dev/null +++ b/resources/dictionaries/vi/ambiguous_expansions.txt @@ -0,0 +1,3 @@ +d +p +q \ No newline at end of file