From 3a6806ab192fb1e37c47869e36199c6cf7e435f7 Mon Sep 17 00:00:00 2001 From: Jehan Date: Thu, 15 Dec 2022 15:11:17 +0100 Subject: [PATCH] =?UTF-8?q?test:=20no:utf-8=20is=20actually=20working=20no?= =?UTF-8?q?w,=20after=20the=20last=20model=20script=20fix=E2=80=A6?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit … and rebuild of models. The scores are really not bad now, 0.896026 for Norwegian and 0.877947 for Danish. It looks like the last confidence computation changes I made are really bearing fruit! --- test/CMakeLists.txt | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt index d996676..a059044 100644 --- a/test/CMakeLists.txt +++ b/test/CMakeLists.txt @@ -38,8 +38,7 @@ foreach(dir ${dirs}) "${lang}:${charset}" STREQUAL "ja:utf-16be" OR "${lang}:${charset}" STREQUAL "es:iso-8859-15" OR "${lang}:${charset}" STREQUAL "da:iso-8859-1" OR - "${lang}:${charset}" STREQUAL "he:iso-8859-8" OR - "${lang}:${charset}" STREQUAL "no:utf-8") + "${lang}:${charset}" STREQUAL "he:iso-8859-8") message(STATUS "Skipping test ${lang}:${charset} (known broken)") else() add_test(NAME "${lang}:${charset}" COMMAND uchardet-tests ${file})