diff options
author | 2012-12-18 13:06:48 +0900 | |
---|---|---|
committer | 2012-12-18 13:06:48 +0900 | |
commit | 21dbe3701c0a0bbc8281becd818cfcae259bb483 (patch) | |
tree | 69490299f32dae609b24646357ca3f7c31aaffb9 | |
parent | c5da4365fbe6ff23a8db381ee7de6fa43fd7086b (diff) | |
download | latinime-21dbe3701c0a0bbc8281becd818cfcae259bb483.tar.gz latinime-21dbe3701c0a0bbc8281becd818cfcae259bb483.tar.xz latinime-21dbe3701c0a0bbc8281becd818cfcae259bb483.zip |
Update dictionaries
cs, da, de, el, es, fi, fr, hr, it, lt, lv, nb, nl, pl,
pt_BR, pt_PT, sl, sr, sv, tr : rescale frequencies to match
spec. This has no large effect in practice, except that the
dictionary will become stronger vs. the spatial model (especially
for lower-count corpora, like lt, lv, sr).
en* : Small changes (rounding going the other way essentially)
ru : the above rescaling, and remove the following words:
Дре, ОСТа, Планше, легкими, легком, легкому, легкости,
легкую, нелегкие, нелегкий, нелегким, нелегкое, нелегкой,
нелегкую, полулегком and add нелёгкие, нелёгкое, нелёгкую;
other accented forms were already in the dictionary.
Change-Id: I40386c2ebd4d2be38874e822bde89db7cb512ae6
-rw-r--r-- | dictionaries/cs_wordlist.combined.gz | bin | 945721 -> 948225 bytes |
-rw-r--r-- | dictionaries/da_wordlist.combined.gz | bin | 1016252 -> 1017628 bytes |
-rw-r--r-- | dictionaries/de_wordlist.combined.gz | bin | 1291152 -> 1292066 bytes |
-rw-r--r-- | dictionaries/el_wordlist.combined.gz | bin | 1132398 -> 1134962 bytes |
-rw-r--r-- | dictionaries/en_GB_wordlist.combined.gz | bin | 859625 -> 859871 bytes |
-rw-r--r-- | dictionaries/en_wordlist.combined.gz | bin | 901947 -> 908317 bytes |
-rw-r--r-- | dictionaries/es_wordlist.combined.gz | bin | 948262 -> 951599 bytes |
-rw-r--r-- | dictionaries/fi_wordlist.combined.gz | bin | 1267631 -> 1269538 bytes |
-rw-r--r-- | dictionaries/fr_wordlist.combined.gz | bin | 1106190 -> 1107515 bytes |
-rw-r--r-- | dictionaries/hr_wordlist.combined.gz | bin | 1010674 -> 1014468 bytes |
-rw-r--r-- | dictionaries/it_wordlist.combined.gz | bin | 931870 -> 933663 bytes |
-rw-r--r-- | dictionaries/lt_wordlist.combined.gz | bin | 977866 -> 980858 bytes |
-rw-r--r-- | dictionaries/lv_wordlist.combined.gz | bin | 963904 -> 970342 bytes |
-rw-r--r-- | dictionaries/nb_wordlist.combined.gz | bin | 964442 -> 964815 bytes |
-rw-r--r-- | dictionaries/nl_wordlist.combined.gz | bin | 1050110 -> 1053208 bytes |
-rw-r--r-- | dictionaries/pl_wordlist.combined.gz | bin | 1086804 -> 1089244 bytes |
-rw-r--r-- | dictionaries/pt_BR_wordlist.combined.gz | bin | 876891 -> 878493 bytes |
-rw-r--r-- | dictionaries/pt_PT_wordlist.combined.gz | bin | 1102056 -> 1105813 bytes |
-rw-r--r-- | dictionaries/ru_wordlist.combined.gz | bin | 1379075 -> 1384484 bytes |
-rw-r--r-- | dictionaries/sl_wordlist.combined.gz | bin | 313077 -> 315122 bytes |
-rw-r--r-- | dictionaries/sr_wordlist.combined.gz | bin | 1049710 -> 1051980 bytes |
-rw-r--r-- | dictionaries/sv_wordlist.combined.gz | bin | 1137493 -> 1139229 bytes |
-rw-r--r-- | dictionaries/tr_wordlist.combined.gz | bin | 924020 -> 925907 bytes |
-rw-r--r-- | java/res/raw/main_de.dict | bin | 1605718 -> 1605718 bytes |
-rw-r--r-- | java/res/raw/main_en.dict | bin | 1069823 -> 1069823 bytes |
-rw-r--r-- | java/res/raw/main_es.dict | bin | 1138885 -> 1138885 bytes |
-rw-r--r-- | java/res/raw/main_fr.dict | bin | 1329621 -> 1329621 bytes |
-rw-r--r-- | java/res/raw/main_it.dict | bin | 1143329 -> 1143329 bytes |
-rw-r--r-- | java/res/raw/main_pt_br.dict | bin | 1091987 -> 1091987 bytes |
-rw-r--r-- | java/res/raw/main_ru.dict | bin | 2223791 -> 2228258 bytes |
30 files changed, 0 insertions, 0 deletions
diff --git a/dictionaries/cs_wordlist.combined.gz b/dictionaries/cs_wordlist.combined.gz Binary files differindex 8cbf2e961..b8d4d60eb 100644 --- a/dictionaries/cs_wordlist.combined.gz +++ b/dictionaries/cs_wordlist.combined.gz diff --git a/dictionaries/da_wordlist.combined.gz b/dictionaries/da_wordlist.combined.gz Binary files differindex 1cccb8632..919d28e1d 100644 --- a/dictionaries/da_wordlist.combined.gz +++ b/dictionaries/da_wordlist.combined.gz diff --git a/dictionaries/de_wordlist.combined.gz b/dictionaries/de_wordlist.combined.gz Binary files differindex 207597a1b..8d0eb6c27 100644 --- a/dictionaries/de_wordlist.combined.gz +++ b/dictionaries/de_wordlist.combined.gz diff --git a/dictionaries/el_wordlist.combined.gz b/dictionaries/el_wordlist.combined.gz Binary files differindex b61da8918..74effa34b 100644 --- a/dictionaries/el_wordlist.combined.gz +++ b/dictionaries/el_wordlist.combined.gz diff --git a/dictionaries/en_GB_wordlist.combined.gz b/dictionaries/en_GB_wordlist.combined.gz Binary files differindex 594bff1de..ce70150af 100644 --- a/dictionaries/en_GB_wordlist.combined.gz +++ b/dictionaries/en_GB_wordlist.combined.gz diff --git a/dictionaries/en_wordlist.combined.gz b/dictionaries/en_wordlist.combined.gz Binary files differindex 4af2b2cdf..5276aaa0a 100644 --- a/dictionaries/en_wordlist.combined.gz +++ b/dictionaries/en_wordlist.combined.gz diff --git a/dictionaries/es_wordlist.combined.gz b/dictionaries/es_wordlist.combined.gz Binary files differindex 4e4456e47..e7f91259d 100644 --- a/dictionaries/es_wordlist.combined.gz +++ b/dictionaries/es_wordlist.combined.gz diff --git a/dictionaries/fi_wordlist.combined.gz b/dictionaries/fi_wordlist.combined.gz Binary files differindex 542f45c5c..272011659 100644 --- a/dictionaries/fi_wordlist.combined.gz +++ b/dictionaries/fi_wordlist.combined.gz diff --git a/dictionaries/fr_wordlist.combined.gz b/dictionaries/fr_wordlist.combined.gz Binary files differindex b5a1cc98c..b7a4e3520 100644 --- 
a/dictionaries/fr_wordlist.combined.gz +++ b/dictionaries/fr_wordlist.combined.gz diff --git a/dictionaries/hr_wordlist.combined.gz b/dictionaries/hr_wordlist.combined.gz Binary files differindex 573c3e8ac..68b15c202 100644 --- a/dictionaries/hr_wordlist.combined.gz +++ b/dictionaries/hr_wordlist.combined.gz diff --git a/dictionaries/it_wordlist.combined.gz b/dictionaries/it_wordlist.combined.gz Binary files differindex d143bc425..187e3b296 100644 --- a/dictionaries/it_wordlist.combined.gz +++ b/dictionaries/it_wordlist.combined.gz diff --git a/dictionaries/lt_wordlist.combined.gz b/dictionaries/lt_wordlist.combined.gz Binary files differindex 03cfa8426..019761690 100644 --- a/dictionaries/lt_wordlist.combined.gz +++ b/dictionaries/lt_wordlist.combined.gz diff --git a/dictionaries/lv_wordlist.combined.gz b/dictionaries/lv_wordlist.combined.gz Binary files differindex 6b2ee77d6..f2338c2e0 100644 --- a/dictionaries/lv_wordlist.combined.gz +++ b/dictionaries/lv_wordlist.combined.gz diff --git a/dictionaries/nb_wordlist.combined.gz b/dictionaries/nb_wordlist.combined.gz Binary files differindex 0644fc93a..d0d3d8be8 100644 --- a/dictionaries/nb_wordlist.combined.gz +++ b/dictionaries/nb_wordlist.combined.gz diff --git a/dictionaries/nl_wordlist.combined.gz b/dictionaries/nl_wordlist.combined.gz Binary files differindex 748c5ed77..7b4843f42 100644 --- a/dictionaries/nl_wordlist.combined.gz +++ b/dictionaries/nl_wordlist.combined.gz diff --git a/dictionaries/pl_wordlist.combined.gz b/dictionaries/pl_wordlist.combined.gz Binary files differindex 638c8eef5..12d523811 100644 --- a/dictionaries/pl_wordlist.combined.gz +++ b/dictionaries/pl_wordlist.combined.gz diff --git a/dictionaries/pt_BR_wordlist.combined.gz b/dictionaries/pt_BR_wordlist.combined.gz Binary files differindex 6f7952004..19394cb79 100644 --- a/dictionaries/pt_BR_wordlist.combined.gz +++ b/dictionaries/pt_BR_wordlist.combined.gz diff --git a/dictionaries/pt_PT_wordlist.combined.gz 
b/dictionaries/pt_PT_wordlist.combined.gz Binary files differindex d60a2fc4f..b29e4fd10 100644 --- a/dictionaries/pt_PT_wordlist.combined.gz +++ b/dictionaries/pt_PT_wordlist.combined.gz diff --git a/dictionaries/ru_wordlist.combined.gz b/dictionaries/ru_wordlist.combined.gz Binary files differindex c589aaa97..9fa7da5d4 100644 --- a/dictionaries/ru_wordlist.combined.gz +++ b/dictionaries/ru_wordlist.combined.gz diff --git a/dictionaries/sl_wordlist.combined.gz b/dictionaries/sl_wordlist.combined.gz Binary files differindex 845b55a8b..c12e7cb66 100644 --- a/dictionaries/sl_wordlist.combined.gz +++ b/dictionaries/sl_wordlist.combined.gz diff --git a/dictionaries/sr_wordlist.combined.gz b/dictionaries/sr_wordlist.combined.gz Binary files differindex c15bc48fd..bb85796b3 100644 --- a/dictionaries/sr_wordlist.combined.gz +++ b/dictionaries/sr_wordlist.combined.gz diff --git a/dictionaries/sv_wordlist.combined.gz b/dictionaries/sv_wordlist.combined.gz Binary files differindex ec399fbf5..b10c14b20 100644 --- a/dictionaries/sv_wordlist.combined.gz +++ b/dictionaries/sv_wordlist.combined.gz diff --git a/dictionaries/tr_wordlist.combined.gz b/dictionaries/tr_wordlist.combined.gz Binary files differindex 3e6ca3263..b33041559 100644 --- a/dictionaries/tr_wordlist.combined.gz +++ b/dictionaries/tr_wordlist.combined.gz diff --git a/java/res/raw/main_de.dict b/java/res/raw/main_de.dict Binary files differindex 59df8b829..a59f7823e 100644 --- a/java/res/raw/main_de.dict +++ b/java/res/raw/main_de.dict diff --git a/java/res/raw/main_en.dict b/java/res/raw/main_en.dict Binary files differindex 14dda8d83..e2fd2585e 100644 --- a/java/res/raw/main_en.dict +++ b/java/res/raw/main_en.dict diff --git a/java/res/raw/main_es.dict b/java/res/raw/main_es.dict Binary files differindex c010da343..ac15d3992 100644 --- a/java/res/raw/main_es.dict +++ b/java/res/raw/main_es.dict diff --git a/java/res/raw/main_fr.dict b/java/res/raw/main_fr.dict Binary files differindex ce4e199b4..5aed479c6 100644 
--- a/java/res/raw/main_fr.dict +++ b/java/res/raw/main_fr.dict diff --git a/java/res/raw/main_it.dict b/java/res/raw/main_it.dict Binary files differindex 59b78d643..e289cefbe 100644 --- a/java/res/raw/main_it.dict +++ b/java/res/raw/main_it.dict diff --git a/java/res/raw/main_pt_br.dict b/java/res/raw/main_pt_br.dict Binary files differindex 2a8af6f6e..28db0ed74 100644 --- a/java/res/raw/main_pt_br.dict +++ b/java/res/raw/main_pt_br.dict diff --git a/java/res/raw/main_ru.dict b/java/res/raw/main_ru.dict Binary files differindex 8a1d215a3..011f22e10 100644 --- a/java/res/raw/main_ru.dict +++ b/java/res/raw/main_ru.dict |