From 837557ce975bab5f81b08812026e9ed8b279ff73 Mon Sep 17 00:00:00 2001 From: Al Date: Tue, 3 Mar 2015 18:45:37 -0500 Subject: [PATCH] [dictionaries] German dictionaries (including concatenated suffixes) --- .../de/academic_degrees/academic_degrees.txt | 4 ++ .../de/company_types/company_types.txt | 4 ++ .../concatenated_suffixes_inseparable | 3 ++ .../concatenated_suffixes_separable.txt | 12 ++++++ .../de/personal_suffixes/personal_suffixes | 2 + .../de/personal_titles/personal_titles.txt | 7 ++++ .../de/place_names/place_names.txt | 28 ++++++++++++++ .../dictionaries/de/qualifiers/qualifiers.txt | 3 ++ data/dictionaries/de/stopwords/stopwords.txt | 38 +++++++++++++++++++ .../de/street_types/street_types.txt | 35 +++++++++++++++++ data/dictionaries/de/synonyms/synonyms.txt | 3 ++ data/dictionaries/de/toponyms/toponyms.txt | 1 + .../dictionaries/de/unit_types/unit_types.txt | 2 + 13 files changed, 142 insertions(+) create mode 100644 data/dictionaries/de/academic_degrees/academic_degrees.txt create mode 100644 data/dictionaries/de/company_types/company_types.txt create mode 100644 data/dictionaries/de/concatenated_suffixes_inseparable/concatenated_suffixes_inseparable create mode 100644 data/dictionaries/de/concatenated_suffixes_separable/concatenated_suffixes_separable.txt create mode 100644 data/dictionaries/de/personal_suffixes/personal_suffixes create mode 100644 data/dictionaries/de/personal_titles/personal_titles.txt create mode 100644 data/dictionaries/de/place_names/place_names.txt create mode 100644 data/dictionaries/de/qualifiers/qualifiers.txt create mode 100644 data/dictionaries/de/stopwords/stopwords.txt create mode 100644 data/dictionaries/de/street_types/street_types.txt create mode 100644 data/dictionaries/de/synonyms/synonyms.txt create mode 100644 data/dictionaries/de/toponyms/toponyms.txt create mode 100644 data/dictionaries/de/unit_types/unit_types.txt diff --git a/data/dictionaries/de/academic_degrees/academic_degrees.txt 
b/data/dictionaries/de/academic_degrees/academic_degrees.txt new file mode 100644 index 00000000..ca8a6770 --- /dev/null +++ b/data/dictionaries/de/academic_degrees/academic_degrees.txt @@ -0,0 +1,4 @@ +diplom ingenieur|dipl ing +diplom kaufmann|dipl kfm +doktor der medizin|dr med +doktor der philosophie|dr phil \ No newline at end of file diff --git a/data/dictionaries/de/company_types/company_types.txt b/data/dictionaries/de/company_types/company_types.txt new file mode 100644 index 00000000..3a8099e3 --- /dev/null +++ b/data/dictionaries/de/company_types/company_types.txt @@ -0,0 +1,4 @@ +aktiengesellschaft|ag +firma|fa +fussball club|fc|f c +gmbh \ No newline at end of file diff --git a/data/dictionaries/de/concatenated_suffixes_inseparable/concatenated_suffixes_inseparable b/data/dictionaries/de/concatenated_suffixes_inseparable/concatenated_suffixes_inseparable new file mode 100644 index 00000000..fb4a2a70 --- /dev/null +++ b/data/dictionaries/de/concatenated_suffixes_inseparable/concatenated_suffixes_inseparable @@ -0,0 +1,3 @@ +berg|bg +burg|bg +dorf|df \ No newline at end of file diff --git a/data/dictionaries/de/concatenated_suffixes_separable/concatenated_suffixes_separable.txt b/data/dictionaries/de/concatenated_suffixes_separable/concatenated_suffixes_separable.txt new file mode 100644 index 00000000..5c90071e --- /dev/null +++ b/data/dictionaries/de/concatenated_suffixes_separable/concatenated_suffixes_separable.txt @@ -0,0 +1,12 @@ +allee +brucke|br +burgermeister|bgm +damm +gasse +hof +kamp +pfad +platz|pl +quelle|qu +strasse|str +weg|w \ No newline at end of file diff --git a/data/dictionaries/de/personal_suffixes/personal_suffixes b/data/dictionaries/de/personal_suffixes/personal_suffixes new file mode 100644 index 00000000..8aa1fd70 --- /dev/null +++ b/data/dictionaries/de/personal_suffixes/personal_suffixes @@ -0,0 +1,2 @@ +der jungere +der altere \ No newline at end of file diff --git a/data/dictionaries/de/personal_titles/personal_titles.txt 
b/data/dictionaries/de/personal_titles/personal_titles.txt new file mode 100644 index 00000000..58fce466 --- /dev/null +++ b/data/dictionaries/de/personal_titles/personal_titles.txt @@ -0,0 +1,7 @@ +doktor|dr +burgermeister|bgm +direktor|dir +herr|hr +herrn|hrn +ingenieur|ing +sankt|st \ No newline at end of file diff --git a/data/dictionaries/de/place_names/place_names.txt b/data/dictionaries/de/place_names/place_names.txt new file mode 100644 index 00000000..42c27025 --- /dev/null +++ b/data/dictionaries/de/place_names/place_names.txt @@ -0,0 +1,28 @@ +altstoffsammelzentrum|asz|a s z +apotheke +bundesgymnasium|bg|b g +bundesrealgymnasium|brg|b r g +allgemeiner deutscher automobil club|adac|a d a c +auswartiges amt|aa|a a +bank +bustenhalter|bh +cafe +denkmal|dkm +deutsche bahn|db|d b +deutscher alpenverein|dav|d a v +fabrik|fb +fachhochschule|fh +freiwillige feuerwehr|ff +gasthaus|gh +gasthof|ghf +hafen +haus +handelsakademie|hak +handelsschule|hasch +hotel +jugendherberge|jh|j h +kaffee +markt|mkt +marktplatz|markt platz|markt pl|mkt pl|marktpl +sportplatz|sport platz|sport pl|sportpl +restaurant \ No newline at end of file diff --git a/data/dictionaries/de/qualifiers/qualifiers.txt b/data/dictionaries/de/qualifiers/qualifiers.txt new file mode 100644 index 00000000..03b3db9e --- /dev/null +++ b/data/dictionaries/de/qualifiers/qualifiers.txt @@ -0,0 +1,3 @@ +bezirk|bez +gemeinde|gde +hauptstadt|hptst \ No newline at end of file diff --git a/data/dictionaries/de/stopwords/stopwords.txt b/data/dictionaries/de/stopwords/stopwords.txt new file mode 100644 index 00000000..c8636cef --- /dev/null +++ b/data/dictionaries/de/stopwords/stopwords.txt @@ -0,0 +1,38 @@ +am +an +an der|a.d.|a d +auf +auf der|a.d.|a d +bei|b +beim +bis +das +de +dem +den +der +des +die +du +fur +gegenuber +im|i +in|i +in der|id|i d +mit +nach +nachst +neben +ob|o +uber +und|& +unter +vor|v +von|v +von der|v d|vd +zu +zu der +zur +zu dem +zwischen +zum|z \ No newline at end of file diff --git 
a/data/dictionaries/de/street_types/street_types.txt b/data/dictionaries/de/street_types/street_types.txt new file mode 100644 index 00000000..756efb54 --- /dev/null +++ b/data/dictionaries/de/street_types/street_types.txt @@ -0,0 +1,35 @@ +allee|a|al +autobahn +bach +bad +bahnhof|bhf|bf +boulevard|bd +brucke|bruecke|br +buhl|buehl +chaussee|ch +damm|d +forsthaus|fh +gasse|g +graben|gr +grosser +grosse|gr|g +grosses +hauptbahnhof|hbf +heiligen +hof|h +kamp|k +kleine|kl +kleiner +kleines +obere|ob +oberer|ob +oberes +pfad|p +platz|pl +quelle|qu +rhein|rh +strasse|str +untere|u +unterer +unteres +weg|w \ No newline at end of file diff --git a/data/dictionaries/de/synonyms/synonyms.txt b/data/dictionaries/de/synonyms/synonyms.txt new file mode 100644 index 00000000..78a5de00 --- /dev/null +++ b/data/dictionaries/de/synonyms/synonyms.txt @@ -0,0 +1,3 @@ +deutsch|dt +ehemalige|ehem +haltestelle|hst \ No newline at end of file diff --git a/data/dictionaries/de/toponyms/toponyms.txt b/data/dictionaries/de/toponyms/toponyms.txt new file mode 100644 index 00000000..6d9657ab --- /dev/null +++ b/data/dictionaries/de/toponyms/toponyms.txt @@ -0,0 +1 @@ +burgenlaendische|burgenlandische|bgld \ No newline at end of file diff --git a/data/dictionaries/de/unit_types/unit_types.txt b/data/dictionaries/de/unit_types/unit_types.txt new file mode 100644 index 00000000..f6c95ae7 --- /dev/null +++ b/data/dictionaries/de/unit_types/unit_types.txt @@ -0,0 +1,2 @@ +abteilung|abt +buro \ No newline at end of file