From 21dbe3701c0a0bbc8281becd818cfcae259bb483 Mon Sep 17 00:00:00 2001 From: Jean Chalard Date: Tue, 18 Dec 2012 13:06:48 +0900 Subject: Update dictionaries MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit cs, da, de, el, es, fi, fr, hr, it, lt, lv, nb, nl, pl, pt_BR, pt_PT, sl, sr, sv, tr : rescale frequencies to match spec. This has no large effect in practice, except that the dictionary will become stronger vs the spatial model (especially in lower count corpora, like lt, lv, sr) en* : Small changes (rounding going the other way essentially) ru : the above rescaling, and remove the following words: Дре, ОСТа, Планше, легкими, легком, легкому, легкости, легкую, нелегкие, нелегкий, нелегким, нелегкое, нелегкой, нелегкую, полулегком and add нелёгкие, нелёгкое, нелёгкую; other accented forms were already in the dictionary. Change-Id: I40386c2ebd4d2be38874e822bde89db7cb512ae6 --- dictionaries/cs_wordlist.combined.gz | Bin 945721 -> 948225 bytes dictionaries/da_wordlist.combined.gz | Bin 1016252 -> 1017628 bytes dictionaries/de_wordlist.combined.gz | Bin 1291152 -> 1292066 bytes dictionaries/el_wordlist.combined.gz | Bin 1132398 -> 1134962 bytes dictionaries/en_GB_wordlist.combined.gz | Bin 859625 -> 859871 bytes dictionaries/en_wordlist.combined.gz | Bin 901947 -> 908317 bytes dictionaries/es_wordlist.combined.gz | Bin 948262 -> 951599 bytes dictionaries/fi_wordlist.combined.gz | Bin 1267631 -> 1269538 bytes dictionaries/fr_wordlist.combined.gz | Bin 1106190 -> 1107515 bytes dictionaries/hr_wordlist.combined.gz | Bin 1010674 -> 1014468 bytes dictionaries/it_wordlist.combined.gz | Bin 931870 -> 933663 bytes dictionaries/lt_wordlist.combined.gz | Bin 977866 -> 980858 bytes dictionaries/lv_wordlist.combined.gz | Bin 963904 -> 970342 bytes dictionaries/nb_wordlist.combined.gz | Bin 964442 -> 964815 bytes dictionaries/nl_wordlist.combined.gz | Bin 1050110 -> 1053208 bytes dictionaries/pl_wordlist.combined.gz | Bin 1086804 -> 1089244 
bytes dictionaries/pt_BR_wordlist.combined.gz | Bin 876891 -> 878493 bytes dictionaries/pt_PT_wordlist.combined.gz | Bin 1102056 -> 1105813 bytes dictionaries/ru_wordlist.combined.gz | Bin 1379075 -> 1384484 bytes dictionaries/sl_wordlist.combined.gz | Bin 313077 -> 315122 bytes dictionaries/sr_wordlist.combined.gz | Bin 1049710 -> 1051980 bytes dictionaries/sv_wordlist.combined.gz | Bin 1137493 -> 1139229 bytes dictionaries/tr_wordlist.combined.gz | Bin 924020 -> 925907 bytes java/res/raw/main_de.dict | Bin 1605718 -> 1605718 bytes java/res/raw/main_en.dict | Bin 1069823 -> 1069823 bytes java/res/raw/main_es.dict | Bin 1138885 -> 1138885 bytes java/res/raw/main_fr.dict | Bin 1329621 -> 1329621 bytes java/res/raw/main_it.dict | Bin 1143329 -> 1143329 bytes java/res/raw/main_pt_br.dict | Bin 1091987 -> 1091987 bytes java/res/raw/main_ru.dict | Bin 2223791 -> 2228258 bytes 30 files changed, 0 insertions(+), 0 deletions(-) diff --git a/dictionaries/cs_wordlist.combined.gz b/dictionaries/cs_wordlist.combined.gz index 8cbf2e961..b8d4d60eb 100644 Binary files a/dictionaries/cs_wordlist.combined.gz and b/dictionaries/cs_wordlist.combined.gz differ diff --git a/dictionaries/da_wordlist.combined.gz b/dictionaries/da_wordlist.combined.gz index 1cccb8632..919d28e1d 100644 Binary files a/dictionaries/da_wordlist.combined.gz and b/dictionaries/da_wordlist.combined.gz differ diff --git a/dictionaries/de_wordlist.combined.gz b/dictionaries/de_wordlist.combined.gz index 207597a1b..8d0eb6c27 100644 Binary files a/dictionaries/de_wordlist.combined.gz and b/dictionaries/de_wordlist.combined.gz differ diff --git a/dictionaries/el_wordlist.combined.gz b/dictionaries/el_wordlist.combined.gz index b61da8918..74effa34b 100644 Binary files a/dictionaries/el_wordlist.combined.gz and b/dictionaries/el_wordlist.combined.gz differ diff --git a/dictionaries/en_GB_wordlist.combined.gz b/dictionaries/en_GB_wordlist.combined.gz index 594bff1de..ce70150af 100644 Binary files 
a/dictionaries/en_GB_wordlist.combined.gz and b/dictionaries/en_GB_wordlist.combined.gz differ diff --git a/dictionaries/en_wordlist.combined.gz b/dictionaries/en_wordlist.combined.gz index 4af2b2cdf..5276aaa0a 100644 Binary files a/dictionaries/en_wordlist.combined.gz and b/dictionaries/en_wordlist.combined.gz differ diff --git a/dictionaries/es_wordlist.combined.gz b/dictionaries/es_wordlist.combined.gz index 4e4456e47..e7f91259d 100644 Binary files a/dictionaries/es_wordlist.combined.gz and b/dictionaries/es_wordlist.combined.gz differ diff --git a/dictionaries/fi_wordlist.combined.gz b/dictionaries/fi_wordlist.combined.gz index 542f45c5c..272011659 100644 Binary files a/dictionaries/fi_wordlist.combined.gz and b/dictionaries/fi_wordlist.combined.gz differ diff --git a/dictionaries/fr_wordlist.combined.gz b/dictionaries/fr_wordlist.combined.gz index b5a1cc98c..b7a4e3520 100644 Binary files a/dictionaries/fr_wordlist.combined.gz and b/dictionaries/fr_wordlist.combined.gz differ diff --git a/dictionaries/hr_wordlist.combined.gz b/dictionaries/hr_wordlist.combined.gz index 573c3e8ac..68b15c202 100644 Binary files a/dictionaries/hr_wordlist.combined.gz and b/dictionaries/hr_wordlist.combined.gz differ diff --git a/dictionaries/it_wordlist.combined.gz b/dictionaries/it_wordlist.combined.gz index d143bc425..187e3b296 100644 Binary files a/dictionaries/it_wordlist.combined.gz and b/dictionaries/it_wordlist.combined.gz differ diff --git a/dictionaries/lt_wordlist.combined.gz b/dictionaries/lt_wordlist.combined.gz index 03cfa8426..019761690 100644 Binary files a/dictionaries/lt_wordlist.combined.gz and b/dictionaries/lt_wordlist.combined.gz differ diff --git a/dictionaries/lv_wordlist.combined.gz b/dictionaries/lv_wordlist.combined.gz index 6b2ee77d6..f2338c2e0 100644 Binary files a/dictionaries/lv_wordlist.combined.gz and b/dictionaries/lv_wordlist.combined.gz differ diff --git a/dictionaries/nb_wordlist.combined.gz b/dictionaries/nb_wordlist.combined.gz index 
0644fc93a..d0d3d8be8 100644 Binary files a/dictionaries/nb_wordlist.combined.gz and b/dictionaries/nb_wordlist.combined.gz differ diff --git a/dictionaries/nl_wordlist.combined.gz b/dictionaries/nl_wordlist.combined.gz index 748c5ed77..7b4843f42 100644 Binary files a/dictionaries/nl_wordlist.combined.gz and b/dictionaries/nl_wordlist.combined.gz differ diff --git a/dictionaries/pl_wordlist.combined.gz b/dictionaries/pl_wordlist.combined.gz index 638c8eef5..12d523811 100644 Binary files a/dictionaries/pl_wordlist.combined.gz and b/dictionaries/pl_wordlist.combined.gz differ diff --git a/dictionaries/pt_BR_wordlist.combined.gz b/dictionaries/pt_BR_wordlist.combined.gz index 6f7952004..19394cb79 100644 Binary files a/dictionaries/pt_BR_wordlist.combined.gz and b/dictionaries/pt_BR_wordlist.combined.gz differ diff --git a/dictionaries/pt_PT_wordlist.combined.gz b/dictionaries/pt_PT_wordlist.combined.gz index d60a2fc4f..b29e4fd10 100644 Binary files a/dictionaries/pt_PT_wordlist.combined.gz and b/dictionaries/pt_PT_wordlist.combined.gz differ diff --git a/dictionaries/ru_wordlist.combined.gz b/dictionaries/ru_wordlist.combined.gz index c589aaa97..9fa7da5d4 100644 Binary files a/dictionaries/ru_wordlist.combined.gz and b/dictionaries/ru_wordlist.combined.gz differ diff --git a/dictionaries/sl_wordlist.combined.gz b/dictionaries/sl_wordlist.combined.gz index 845b55a8b..c12e7cb66 100644 Binary files a/dictionaries/sl_wordlist.combined.gz and b/dictionaries/sl_wordlist.combined.gz differ diff --git a/dictionaries/sr_wordlist.combined.gz b/dictionaries/sr_wordlist.combined.gz index c15bc48fd..bb85796b3 100644 Binary files a/dictionaries/sr_wordlist.combined.gz and b/dictionaries/sr_wordlist.combined.gz differ diff --git a/dictionaries/sv_wordlist.combined.gz b/dictionaries/sv_wordlist.combined.gz index ec399fbf5..b10c14b20 100644 Binary files a/dictionaries/sv_wordlist.combined.gz and b/dictionaries/sv_wordlist.combined.gz differ diff --git 
a/dictionaries/tr_wordlist.combined.gz b/dictionaries/tr_wordlist.combined.gz index 3e6ca3263..b33041559 100644 Binary files a/dictionaries/tr_wordlist.combined.gz and b/dictionaries/tr_wordlist.combined.gz differ diff --git a/java/res/raw/main_de.dict b/java/res/raw/main_de.dict index 59df8b829..a59f7823e 100644 Binary files a/java/res/raw/main_de.dict and b/java/res/raw/main_de.dict differ diff --git a/java/res/raw/main_en.dict b/java/res/raw/main_en.dict index 14dda8d83..e2fd2585e 100644 Binary files a/java/res/raw/main_en.dict and b/java/res/raw/main_en.dict differ diff --git a/java/res/raw/main_es.dict b/java/res/raw/main_es.dict index c010da343..ac15d3992 100644 Binary files a/java/res/raw/main_es.dict and b/java/res/raw/main_es.dict differ diff --git a/java/res/raw/main_fr.dict b/java/res/raw/main_fr.dict index ce4e199b4..5aed479c6 100644 Binary files a/java/res/raw/main_fr.dict and b/java/res/raw/main_fr.dict differ diff --git a/java/res/raw/main_it.dict b/java/res/raw/main_it.dict index 59b78d643..e289cefbe 100644 Binary files a/java/res/raw/main_it.dict and b/java/res/raw/main_it.dict differ diff --git a/java/res/raw/main_pt_br.dict b/java/res/raw/main_pt_br.dict index 2a8af6f6e..28db0ed74 100644 Binary files a/java/res/raw/main_pt_br.dict and b/java/res/raw/main_pt_br.dict differ diff --git a/java/res/raw/main_ru.dict b/java/res/raw/main_ru.dict index 8a1d215a3..011f22e10 100644 Binary files a/java/res/raw/main_ru.dict and b/java/res/raw/main_ru.dict differ -- cgit v1.2.3-83-g751a