From c5b5a83b4f819bae9a93640b03040b1b0b2f306b Mon Sep 17 00:00:00 2001
From: Weng Xuetian
Date: Mon, 13 Jan 2025 13:48:17 -0800
Subject: [PATCH] Update language model with unigram score based on frequency (#80)

---
Review notes (free-form commentary placed before the diff header):
  Purpose: point the language-model download at a newer archive.
  LM_TAR changes from lm_sc.arpa-20241001.tar.zst to
  lm_sc.arpa-20250113.tar.zst, and the last argument of fcitx5_download
  is replaced with a new value to go with it. That argument is 64 hex
  digits, presumably a SHA-256 checksum of the archive; confirm against
  the definition of fcitx5_download.
  NOTE(review): line breaks, the two blank context lines and the
  two-space continuation indent were reconstructed to satisfy the
  "-1,9 +1,9" hunk counts; verify against the target file before applying.

 data/CMakeLists.txt | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/data/CMakeLists.txt b/data/CMakeLists.txt
index a9029d1..2b16766 100644
--- a/data/CMakeLists.txt
+++ b/data/CMakeLists.txt
@@ -1,9 +1,9 @@
-set(LM_TAR "lm_sc.arpa-20241001.tar.zst")
+set(LM_TAR "lm_sc.arpa-20250113.tar.zst")
 # Use our own file server for convenience.
 set(LM_URL "https://download.fcitx-im.org/data/${LM_TAR}")
 
 fcitx5_download(lm-download ${LM_URL} ${LM_TAR}
-  54934e73966eb38ea4fe8eae9c61dfe486af37da1cb5316a06b19c7d289e3063)
+  ee83ecf20d52e8bccdba4cf6cd57183d53c257713a5eb77ee3a63d50fc3796dd)
 fcitx5_extract(lm-extract ${LM_TAR} DEPENDS lm-download
   OUTPUT lm_sc.arpa)
 