script: regenerate Slovak and Slovene with better alphabet support.

I was missing some characters, especially in the Slovak alphabet.
Oppositely the Slovene alphabet does not use 4 of the common ASCII
alphabet.
This commit is contained in:
Jehan 2021-03-21 13:30:41 +01:00
parent adb158b058
commit ba7d72e3b0
6 changed files with 587 additions and 558 deletions

View File

@ -1,156 +1,175 @@
= Logs of language model for Slovak (sk) = = Logs of language model for Slovak (sk) =
- Generated by BuildLangModel.py - Generated by BuildLangModel.py
- Started: 2021-03-16 20:04:01.478267 - Started: 2021-03-21 12:48:41.368218
- Maximum depth: 4 - Maximum depth: 4
- Max number of pages: 100 - Max number of pages: 100
== Parsed pages == == Parsed pages ==
Dôkaz (matematika) (revision 7170221) Európska_únia (revision 7169513)
1825 (revision 6937105) 1. decembra (revision 6792273)
1839 (revision 6804159) 1. júl (revision 7066144)
1847 (revision 7167629) 1. svetová vojna (revision 7159151)
1852 (revision 6923466) 10 centov (euro) (revision 6293215)
1878 (revision 7159904) 1952 (revision 7177031)
1955 (revision 7061181) 1957 (revision 7078231)
1976 (revision 7100059) 1958 (revision 7144704)
1983 (revision 7174204) 1960 (revision 7163978)
1967 (revision 7016805)
1968 (revision 7173483)
1973 (revision 7149623)
1979 (revision 7169115)
1981 (revision 7066520)
1985 (revision 7161691)
1986 (revision 7151177)
1987 (revision 7065067)
1990 (revision 7178863)
1992 (revision 7135542)
1993 (revision 7122277) 1993 (revision 7122277)
1995 (revision 7133683) 1995 (revision 7133683)
2012 (revision 7135523) 1999 (revision 7133241)
Adrien-Marie Legendre (revision 6556308) 1 cent (euro) (revision 6963154)
Algebraická geometria (revision 5964212) 1 euro (revision 6264994)
Algebraická rovnica (revision 6586551) 2003 (revision 7135529)
Algebrické číslo (revision 6382942) 2004 (revision 7149802)
Algoritmus (revision 7100698) 2007 (revision 7135534)
Andrew Wiles (revision 6813255) 2008 (revision 7156084)
Arabi (revision 7124298) 2009 (revision 7135536)
Arabčina (revision 7148041) 2013 (revision 7135522)
Aristoteles (revision 7150270) 2016 (revision 7159554)
Arthur Cayley (revision 6332355) 2017 (revision 7174262)
Axióma (revision 7073489) 20 centov (euro) (revision 6293208)
Babylonia (revision 6432954) 23. jún (revision 7052430)
Bernard Bolzano (revision 6903631) 2 centy (euro) (revision 6963155)
Boh (revision 7166677) 2 eurá (revision 6452782)
Bolzanova veta (revision 6852875) 31. december (revision 7149783)
Bytie (revision 6569833) 50 centov (euro) (revision 6293202)
Byzantská ríša (revision 7168566) 5 centov (euro) (revision 6963157)
Caroline Blundenová (revision 7170221) Acquis communautaire (revision 7033703)
Cauchyho postupnosť (revision 6215169) Al Gore (revision 7146244)
Celé číslo (revision 7047567) Albánsko (revision 7172414)
Charles Hermite (revision 6412828) Americký dolár (revision 7050515)
Daniel Marcus (revision 5291472) Amsterdamská zmluva (revision 7070102)
David Hilbert (revision 5968866) Angličtina (revision 7148052)
Dedukcia (revision 6338099) Angola (revision 7035956)
Definícia (revision 6965423) Antigua a Barbuda (revision 6560340)
Derivácia (funkcia) (revision 7014993) Argentína (revision 7171908)
Desiatková číselná sústava (revision 7047888) Arménsko (revision 7147325)
Diofantická rovnica (revision 6060359) Atény (revision 7150984)
Dynastia Chan (revision 7025657) Austrália (štát) (revision 7154003)
Dôkaz (logika) (revision 5495754) Azory (revision 6595058)
Dôkaz sporom (revision 7051518) Bahrajn (revision 7178284)
Energia (revision 6975312) Bangladéš (revision 7147804)
Eric Weisstein (revision 6054413) Barack Obama (revision 7158748)
Ernst Kummer (revision 6001344) Barbados (revision 7178784)
Európa (revision 7164742) Belgicko (revision 7163339)
Experiment (revision 6354302) Belgický frank (revision 6953531)
Fenomén (filozofia) (revision 6558128) Belize (revision 7156055)
Filozofia (revision 6942330) Benin (revision 7172640)
Formula (logika) (revision 3916562) Bolívia (revision 7111159)
Formálny dôkaz (revision 7170221) Botswana (revision 7158699)
Formálny jazyk (revision 6505890) Brazília (revision 7177507)
Gabriel Cramer (revision 7068001) Brettonwoodská menová sústava (revision 6710540)
Galoisova teória (revision 6749172) Brunej (revision 6975045)
Gentzenovský kalkul (revision 7170221) Brusel (revision 7037073)
Geometria (revision 7010499) Bulharsko (revision 7177290)
Geometrický dôkaz (revision 7170221) Bulharský lev (revision 6230899)
Georg Ferdinand Cantor (revision 6697670) Bulharčina (revision 7150125)
Giordano Bruno (revision 7072808) Burkina (revision 7158783)
Gottlob Frege (revision 6580699) Burundi (revision 7049945)
Gödelova veta o neúplnosti (revision 6968373) Ceuta (revision 6575679)
Hardvér (revision 6946820) Charles Michel (revision 7098830)
Henri Poincaré (revision 6830074) Chorvátska kuna (revision 6935490)
Hilbertovský kalkul (revision 7170221) Chorvátsko (revision 7131429)
Hmotnosť (revision 7021343) Chorvátčina (revision 7178832)
Hypotéza (revision 6850461) Clo (revision 6894735)
Idea (revision 6113421) Cyperská libra (revision 5964697)
India (revision 6976622) Cyprus (revision 7035263)
Intuícia (revision 5837951) David-Maria Sassoli (revision 7032560)
Jazyk (lingvistika) (revision 6462864) David Cameron (revision 7078464)
John Taylor (revision 6741201) Demokracia (revision 7049807)
Kardinálne číslo (revision 7154031) Denis Mukwege (revision 6800186)
Kenneth Appel (revision 5968422) Dominika (štát) (revision 7126694)
Klasická mechanika (revision 6295646) Dominikánska republika (revision 7080374)
Konečná množina (revision 6850487) Drachma (novoveké Grécko) (revision 6391564)
Konfucianizmus (revision 6948500) Druhá svetová vojna (revision 7151355)
Kresťanstvo (revision 7150939) Dunaj (revision 7150320)
Latinčina (revision 7110742) Dánska koruna (revision 6125942)
Leonhard Euler (revision 7016638) Dánsko (revision 7161625)
Lineárna algebra (revision 6564030) Dánčina (revision 6557304)
Logická axióma (revision 5495754) Džibutsko (revision 7111764)
Logický kalkul (revision 1608550) EHS (revision 6927031)
Eduard Kukan (revision 7079321)
Egypt (revision 7151318)
Ekvádor (revision 7073543)
Ellen Johnsonová- Sirleafová (revision 7151906)
Estónska koruna (revision 6751629)
Estónsko (revision 7148919)
== End of Parsed pages == == End of Parsed pages ==
- Wikipedia parsing ended at: 2021-03-16 20:13:09.022092 - Wikipedia parsing ended at: 2021-03-21 13:00:32.553701
64 characters appeared 535286 times. 70 characters appeared 674892 times.
First 46 characters: Most Frequent characters:
[ 0] Char o: 8.787265125559047 % [ 0] Char a: 8.935503754674821 %
[ 1] Char a: 8.624174740232323 % [ 1] Char o: 8.347409659619613 %
[ 2] Char e: 8.577470735270492 % [ 2] Char e: 8.052103151319026 %
[ 3] Char n: 6.100103496074995 % [ 3] Char n: 6.170320584626874 %
[ 4] Char i: 5.884891441210867 % [ 4] Char r: 6.046300741451965 %
[ 5] Char t: 5.302772723366575 % [ 5] Char i: 5.852195610556948 %
[ 6] Char r: 5.02273550961542 % [ 6] Char s: 5.3632284869282785 %
[ 7] Char s: 4.340670221152805 % [ 7] Char k: 4.751278723114217 %
[ 8] Char k: 4.253240323864252 % [ 8] Char t: 4.600439774067555 %
[ 9] Char v: 4.073896944810811 % [ 9] Char l: 4.167037096305779 %
[10] Char l: 3.6208680966810265 % [10] Char v: 4.090580418792933 %
[11] Char d: 3.3796886150581185 % [11] Char m: 3.1385762462734776 %
[12] Char m: 3.248356953105443 % [12] Char d: 2.7853345424156752 %
[13] Char p: 2.8470761424733695 % [13] Char u: 2.7336225647955525 %
[14] Char u: 2.6178528861206907 % [14] Char p: 2.6873929458342967 %
[15] Char c: 2.426740097816868 % [15] Char c: 2.5881178025521123 %
[16] Char z: 2.104856095619912 % [16] Char á: 2.0701089952170126 %
[17] Char h: 2.080570013039758 % [17] Char h: 2.0477350450146097 %
[18] Char j: 2.0389100406138025 % [18] Char j: 1.9521641981235516 %
[19] Char á: 1.675926514050433 % [19] Char b: 1.921344452149381 %
[20] Char b: 1.6690143213160817 % [20] Char z: 1.6398179264237835 %
[21] Char y: 1.6607944164427988 % [21] Char y: 1.3830361005909093 %
[22] Char ý: 1.2490519086992748 % [22] Char ý: 1.2827237543192096 %
[23] Char í: 1.1096871578931637 % [23] Char í: 0.8906610242824038 %
[24] Char č: 0.9322119390381964 % [24] Char č: 0.8473948424340486 %
[25] Char é: 0.8785957413420117 % [25] Char é: 0.7884224438873183 %
[26] Char ž: 0.7489454235679618 % [26] Char ú: 0.7808656792494206 %
[27] Char ú: 0.702615050645823 % [27] Char g: 0.749897761419605 %
[28] Char f: 0.6794498641847535 % [28] Char f: 0.6475110091688744 %
[29] Char š: 0.6790762321450589 % [29] Char š: 0.6189138410293795 %
[30] Char g: 0.6219105300717748 % [30] Char ž: 0.4720755320851336 %
[31] Char ť: 0.4550838243481055 % [31] Char ľ: 0.4089543215803418 %
[32] Char ô: 0.38428055282596596 % [32] Char ó: 0.3095310064425123 %
[33] Char ľ: 0.3648516867618432 % [33] Char ť: 0.24344635882481935 %
[34] Char ó: 0.23090460053130477 % [34] Char w: 0.11735210967088068 %
[35] Char x: 0.22922325635267876 % [35] Char ô: 0.10297943967331069 %
[36] Char ň: 0.09434209002290364 % [36] Char ä: 0.09142203493299668 %
[37] Char w: 0.08855079340763629 % [37] Char x: 0.08312441101687382 %
[38] Char ä: 0.07005600744275023 % [38] Char ň: 0.07201152184349496 %
[39] Char ď: 0.06706695112519288 % [39] Char ď: 0.06993711586446424 %
[40] Char q: 0.018121153925191393 % [40] Char q: 0.017187935254825957 %
[41] Char ĺ: 0.010274881091603367 % [41] Char ë: 0.011112889173378852 %
[42] Char ě: 0.010274881091603367 % [42] Char ř: 0.010075686183863493 %
[43] Char ö: 0.010088065071756034 % [43] Char ü: 0.009186655049993185 %
[44] Char ř: 0.007285824774046024 % [44] Char ě: 0.008445795771767926 %
[45] Char ŕ: 0.006351744674809354 % [45] Char ö: 0.007260420926607517 %
[46] Char ĺ: 0.006371389792737208 %
[47] Char ć: 0.006223217937092157 %
[48] Char ŕ: 0.0044451556693515405 %
The first 46 characters have an accumulated ratio of 0.9998617561453131. The first 49 characters have an accumulated ratio of 0.9998118217433309.
1198 sequences found. 1410 sequences found.
First 512 (typical positive ratio): 0.9724967373205526 First 773 (typical positive ratio): 0.9950030300775062
Next 512 (512-1024): 0.007489454235679618 Next 277 (1050-773): 0.003999347913144824
Rest: 0.00042527339003644096 Rest: 0.0009976220093489419
- Processing end: 2021-03-16 20:13:09.628753 - Processing end: 2021-03-21 13:00:33.050085

View File

@ -1,146 +1,150 @@
= Logs of language model for Slovene (sl) = = Logs of language model for Slovene (sl) =
- Generated by BuildLangModel.py - Generated by BuildLangModel.py
- Started: 2021-03-16 20:13:09.868611 - Started: 2021-03-21 12:30:22.611188
- Maximum depth: 4 - Maximum depth: 4
- Max number of pages: 100 - Max number of pages: 100
== Parsed pages == == Parsed pages ==
XCOM: Enemy Unknown (revision 5360018) Ljubljana (revision 5468628)
1UP.com (revision 5138164) 1689 (revision 4230028)
2K Games (revision 4110089) 1918 (revision 5249637)
Android (operacijski sistem) (revision 5423518) 1926 (revision 5456617)
Animator videoigre (revision 5438736) 1929 (revision 5444196)
App Store (revision 4916505) 1930. (revision 5118014)
Artefakt (revision 4871634) 2011 (revision 5469547)
Athlon (revision 5138170) 25. junij (revision 5447338)
Avstralazija (revision 5234981) A1 (radio) (revision 5360678)
Avtopsija (revision 5394899) ACH Volley (revision 5089458)
Bralno-pisalni pomnilnik (revision 5307992) AKC Metelkova mesto (revision 5323280)
Civilization (serija) (revision 5138157) Abecedarium (revision 5092193)
Deus Ex: Human Revolution (revision 5312201) Academia operosorum Labacensis (revision 5228146)
DirectX (revision 4477913) Adam Bohorič (revision 5414191)
Dishonored (revision 5359830) Ajdovščina (revision 5423173)
Edge (magazine) (revision 5356455) Albert Kosmač (revision 5368699)
Enoigralska videoigra (revision 5116872) Albin Belar (revision 5197298)
Eurogamer (revision 5312201) Aleksander Bajt (revision 4917916)
Evropa (revision 5448355) Aleksandrija (revision 5405515)
Fantasy Flight Games (revision 4649361) Aleš Kunaver (revision 5029295)
Firaxis Games (revision 4110089) Alojzij Šuštar (revision 5442498)
Francoska narodna knjižnica (revision 4596643) Alpe (revision 5464842)
GameRankings (revision 3934020) Amsterdam (revision 5359727)
GameSpot (revision 5116871) Anastasius Grün (revision 5070788)
GameSpy (revision 5168684) Andorra la Vella (revision 5390252)
GameTrailers (revision 5298120) Andrej Fleischmann (revision 4930149)
Game Informer (revision 5360018) Andrej Smole (revision 5467820)
GamesTM (revision 5360018) Angela Vode (revision 5466809)
Grafična kartica (revision 5374734) Anica Cevc (revision 5414746)
Granata (revision 4837685) Anja Bukovec (revision 5041799)
Holografija (revision 4760425) Anton Aleksander Auersperg (revision 5070788)
IGN (revision 5370204) Anton Alojzij Wolf (revision 5361749)
IOS (revision 5404204) Anton Bitenc (revision 5463597)
Igra igranja vlog (revision 4768087) Anton Bonaventura Jeglič (revision 5414522)
Igra na deski (revision 5431955) Anton Cerar (revision 5376771)
Igralna konzola (revision 4773547) Anton Codelli (izumitelj) (revision 5161385)
Igralni pogon (revision 4771045) Anton Foerster (revision 5270593)
Intel (revision 5366957) Anton Gvajc (revision 5035801)
International Standard Book Number (revision 4765322) Anton Lajovic (revision 4867406)
Izdelovalec videoigre (revision 5438736) Anton Melik (revision 5272303)
Joker (revija) (revision 5351778) Anton Ocvirk (revision 5470942)
Kotaku (revision 4613535) Anton Peterlin (revision 4979305)
Kristal (revision 5068718) Anton Stres (revision 5464457)
Linux (revision 5457231) Anton Tomaž Linhart (revision 5413399)
Lovec prestreznik (revision 4758667) Anton Verovšek (revision 5412417)
MTV (revision 5406174) Anton Vodnik (revision 5180239)
Mac OS X (revision 5212452) Anton Šivic (revision 5410565)
Machinima (revision 5295004) Antwerpen (revision 5375367)
Major (revision 4758895) Arena Stožice (revision 5462141)
Mednarodna različica (revision 5032649) Argentinski park, Ljubljana (revision 5398130)
Metacritic (revision 3934020) Argonavti (revision 5425545)
Michael McCann (skladatelj) (revision 5312201) Arne Hodalič (revision 5417283)
MicroProse (revision 5116826) Art nouveau (revision 5371096)
Microsoft Windows (revision 5460799) Ateizem (revision 5427207)
Možje v črnem (revision 5262890) Atene (revision 5360039)
Nezemeljsko življenje (revision 5386002) Ati Soss (revision 5463553)
Normativna kontrola (revision 5316351) Atila (revision 5425308)
NowGamer (revision 5363253) Avgusta Danilova (revision 4788392)
OS X (revision 5212452) Avstro-Ogrska (revision 5431606)
Ognjena ekipa (revision 4694450) Avtobusna postaja Ljubljana (revision 4479008)
Operacijski sistem (revision 5309675) Avtocesta A1 (revision 5292269)
Ostrostrelec (revision 4810396) Avtocesta A2 (revision 5387166)
Pilot (revision 4758828) Aškerčeva cesta, Ljubljana (revision 4578067)
PlayStation 3 (revision 5245525) BTC (revision 5450525)
PlayStation Network (revision 4784984) Bajer (potok) (revision 5147457)
PlayStation Vita (revision 5245581) Bakrorez (revision 5375208)
Procesor (revision 5262718) Bangkok (revision 5378204)
Producent videoiger (revision 5368686) Barje (revision 5180470)
Razvijalec videoiger (revision 5171689) Barok (revision 5463042)
Računalniška miška (revision 5169871) Bejrut (revision 5356724)
Računalniško okolje (revision 5250619) Benetke (revision 5424094)
Severna Amerika (revision 5400891) Beograd (revision 5448139)
Sid Meier (revision 4061487) Berlin (revision 5435344)
Stealth (revision 4618630) Bern (revision 5466493)
Steam (revision 5171704) Biblija (revision 5404188)
Strateška videoigra (revision 5245834) Bicike(lj) (revision 5468628)
Tablični računalnik (revision 5312221) Bine Rogelj (revision 5086972)
Telepatija (revision 4846742) Biodiverziteta (revision 5352270)
The Bureau: XCOM Declassified (revision 5360018) Bizoviški potok (revision 5305268)
The Guardian (revision 5361337) Bled (revision 5469179)
Trdi disk (revision 5329681) Bleiweisova cesta, Ljubljana (revision 5184903)
UFO: Enemy Unknown (revision 5360018) Bogo Grafenauer (revision 5311308)
Unreal Engine (revision 4771045) Bogota (revision 5363243)
Unreal Engine 3 (revision 4771045) Bojan Adamič (revision 5409135)
Uporabniški vmesnik (revision 5118420) Bojan Čop (revision 5247252)
Valve Corporation (revision 5168680) Bojan Štih (revision 5305724)
Večigralska videoigra (revision 4618639) Boris Kobe (revision 5296972)
VideoGamer.com (revision 5363253) Boris Sket (revision 5413264)
Vohunski satelit (revision 5450401) Borut Lesjak (revision 5273043)
Vojaška taktika (revision 4759159) Botanični vrt, Ljubljana (revision 5142111)
Botanični vrt Ljubljana (revision 5142111)
Botanični vrt Univerze v Ljubljani (revision 5142111)
Bovec (revision 5330651)
Boštjan Putrih (revision 5124433)
Boštjan Žekš (revision 5415317)
Božena Ravnihar (revision 5415042)
Božo Vodušek (revision 5122962)
Božo Škerlj (revision 5268384)
== End of Parsed pages == == End of Parsed pages ==
- Wikipedia parsing ended at: 2021-03-16 20:20:05.416719 - Wikipedia parsing ended at: 2021-03-21 12:38:56.631283
41 characters appeared 318060 times. 57 characters appeared 519434 times.
First 29 characters: Most Frequent characters:
[ 0] Char a: 10.018235553040308 % [ 0] Char e: 10.223242991409881 %
[ 1] Char e: 9.988995786958435 % [ 1] Char a: 10.130257164529084 %
[ 2] Char i: 9.602590706156072 % [ 2] Char i: 8.972265966417293 %
[ 3] Char o: 9.246054203609381 % [ 3] Char o: 8.507144314773388 %
[ 4] Char n: 7.188580770923725 % [ 4] Char n: 7.334329289187846 %
[ 5] Char r: 5.758976293781048 % [ 5] Char r: 5.438226993227244 %
[ 6] Char s: 4.588442432245488 % [ 6] Char s: 5.162157271183634 %
[ 7] Char t: 4.5786958435515315 % [ 7] Char l: 5.052614961669818 %
[ 8] Char l: 4.357668364459536 % [ 8] Char t: 4.829679997843807 %
[ 9] Char j: 4.260202477519965 % [ 9] Char j: 4.445223069725894 %
[10] Char v: 3.809344148902723 % [10] Char v: 4.3826549667522725 %
[11] Char p: 3.4980821228698984 % [11] Char k: 3.543664835185991 %
[12] Char k: 3.4751304785260646 % [12] Char d: 3.1351432520782234 %
[13] Char d: 3.143746462931522 % [13] Char p: 2.8430945991213514 %
[14] Char m: 2.928692699490662 % [14] Char m: 2.7564618411578756 %
[15] Char z: 2.332893164811671 % [15] Char u: 2.3069340859473964 %
[16] Char u: 1.9908193422624663 % [16] Char z: 2.0064146744340956 %
[17] Char g: 1.9298245614035088 % [17] Char b: 1.937300985303234 %
[18] Char b: 1.5607118153807458 % [18] Char g: 1.6027060223242993 %
[19] Char c: 1.2903225806451613 % [19] Char h: 1.1235306121663196 %
[20] Char h: 1.2145507137018172 % [20] Char č: 1.0794441642249064 %
[21] Char č: 1.1001068980695468 % [21] Char c: 1.048256371358055 %
[22] Char š: 0.6841476450984091 % [22] Char š: 0.9687467512715764 %
[23] Char ž: 0.44331258253159783 % [23] Char ž: 0.5263421339380941 %
[24] Char f: 0.4203609381877633 % [24] Char f: 0.41391206582549467 %
[25] Char w: 0.2021631138778847 %
[26] Char y: 0.19618939822674966 %
[27] Char x: 0.16726403823178018 %
[28] Char q: 0.011004213041564485 %
The first 29 characters have an accumulated ratio of 0.9998710935043701. The first 25 characters have an accumulated ratio of 0.9976974938105708.
698 sequences found. 880 sequences found.
First 512 (typical positive ratio): 0.998296272473889 First 449 (typical positive ratio): 0.9950499684040537
Next 512 (512-1024): 0.004433125825315978 Next 172 (621-449): 0.003957684836286113
Rest: -2.8189256484623115e-17 Rest: 0.000992346759660201
- Processing end: 2021-03-16 20:20:05.900813 - Processing end: 2021-03-21 12:38:56.993560

View File

@ -58,10 +58,8 @@ charsets = ['ISO-8859-2', 'Windows-1250', 'IBM852', 'MAC-CENTRALEUROPE']
# If use_ascii=True, there is no need to add any ASCII characters. # If use_ascii=True, there is no need to add any ASCII characters.
# If case_mapping=True, there is no need to add several cases of a same # If case_mapping=True, there is no need to add several cases of a same
# character (provided Python algorithms know the right cases). # character (provided Python algorithms know the right cases).
alphabet = 'áäčďĺľňóŕšťúýž' alphabet = 'áäčďéíĺľňóôŕšťúýž'
# The starred page which was rewarded on the main page when I created start_pages = ['Európska_únia']
# the data.
start_pages = ['Dôkaz (matematika)']
# give possibility to select another code for the Wikipedia URL. # give possibility to select another code for the Wikipedia URL.
wikipedia_code = code wikipedia_code = code
# 'a' and 'A' will be considered the same character, and so on. # 'a' and 'A' will be considered the same character, and so on.

View File

@ -44,16 +44,20 @@ import re
name = 'Slovene' name = 'Slovene'
code = 'sl' code = 'sl'
use_ascii = True # ASCII is used except q and w, x and y according to Wikipedia.
use_ascii = False
charsets = ['ISO-8859-2', 'ISO-8859-16', charsets = ['ISO-8859-2', 'ISO-8859-16',
'Windows-1250', 'IBM852', 'MAC-CENTRALEUROPE'] 'Windows-1250', 'IBM852', 'MAC-CENTRALEUROPE']
## Optional Properties ## ## Optional Properties ##
# Alphabet characters. # Alphabet characters.
alphabet = 'čšž' # XXX According to Wikipedia there are 2 incompatible diacritics
# The starred page which was rewarded on the main page when I created # systems, but both seem barely used on Wikipedia (even though I can see
# the data. # some usage here or there, on some titles), so I assume these don't
start_pages = ['XCOM: Enemy Unknown'] # exist. Maybe this would have to be separate models for variants of
# the language.
alphabet = 'abcčdefghijklmnoprsštuvzž'
start_pages = ['Ljubljana']
wikipedia_code = code wikipedia_code = code
case_mapping = True case_mapping = True

View File

@ -42,7 +42,7 @@
/** /**
* Generated by BuildLangModel.py * Generated by BuildLangModel.py
* On: 2021-03-16 20:13:09.022988 * On: 2021-03-21 13:00:32.554155
**/ **/
/* Character Mapping Table: /* Character Mapping Table:
@ -68,18 +68,18 @@ static const unsigned char Iso_8859_2_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 4X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 4X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 6X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 6X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,CTR, /* 7X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */
SYM, 64,SYM, 49,SYM, 33, 65,SYM,SYM, 29, 59, 31, 66,SYM, 26, 61, /* AX */ SYM, 70,SYM, 50,SYM, 31, 58,SYM,SYM, 29, 54, 33, 71,SYM, 30, 63, /* AX */
SYM, 67,SYM, 49,SYM, 33, 68,SYM,SYM, 29, 59, 31, 69,SYM, 26, 61, /* BX */ SYM, 72,SYM, 50,SYM, 31, 58,SYM,SYM, 29, 54, 33, 73,SYM, 30, 63, /* BX */
45, 19, 70, 55, 38, 41, 47, 50, 24, 25, 57, 51, 42, 23, 71, 39, /* CX */ 48, 16, 66, 51, 36, 46, 47, 49, 24, 25, 56, 41, 44, 23, 61, 39, /* CX */
53, 54, 36, 34, 32, 62, 43,SYM, 44, 48, 27, 56, 46, 22, 72, 60, /* DX */ 57, 53, 38, 32, 35, 55, 45,SYM, 42, 52, 26, 74, 43, 22, 68, 59, /* DX */
45, 19, 73, 55, 38, 41, 47, 50, 24, 25, 57, 51, 42, 23, 74, 39, /* EX */ 48, 16, 66, 51, 36, 46, 47, 49, 24, 25, 56, 41, 44, 23, 61, 39, /* EX */
53, 54, 36, 34, 32, 62, 43,SYM, 44, 48, 27, 56, 46, 22, 75,SYM, /* FX */ 57, 53, 38, 32, 35, 55, 45,SYM, 42, 52, 26, 75, 43, 22, 68,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -89,18 +89,18 @@ static const unsigned char Windows_1250_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 4X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 4X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 6X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 6X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,CTR, /* 7X */
SYM,ILL,SYM,ILL,SYM,SYM,SYM,SYM,ILL,SYM, 29,SYM, 76, 31, 26, 77, /* 8X */ SYM,ILL,SYM,ILL,SYM,SYM,SYM,SYM,ILL,SYM, 29,SYM, 58, 33, 30, 76, /* 8X */
ILL,SYM,SYM,SYM,SYM,SYM,SYM,SYM,ILL,SYM, 29,SYM, 78, 31, 26, 79, /* 9X */ ILL,SYM,SYM,SYM,SYM,SYM,SYM,SYM,ILL,SYM, 29,SYM, 58, 33, 30, 77, /* 9X */
SYM,SYM,SYM, 49,SYM, 80,SYM,SYM,SYM,SYM, 59,SYM,SYM,SYM,SYM, 61, /* AX */ SYM,SYM,SYM, 50,SYM, 78,SYM,SYM,SYM,SYM, 54,SYM,SYM,SYM,SYM, 63, /* AX */
SYM,SYM,SYM, 49,SYM,SYM,SYM,SYM,SYM, 81, 59,SYM, 33,SYM, 33, 61, /* BX */ SYM,SYM,SYM, 50,SYM,SYM,SYM,SYM,SYM, 79, 54,SYM, 31,SYM, 31, 63, /* BX */
45, 19, 82, 55, 38, 41, 47, 50, 24, 25, 57, 51, 42, 23, 83, 39, /* CX */ 48, 16, 66, 51, 36, 46, 47, 49, 24, 25, 56, 41, 44, 23, 61, 39, /* CX */
53, 54, 36, 34, 32, 62, 43,SYM, 44, 48, 27, 56, 46, 22, 84, 60, /* DX */ 57, 53, 38, 32, 35, 55, 45,SYM, 42, 52, 26, 80, 43, 22, 68, 59, /* DX */
45, 19, 85, 55, 38, 41, 47, 50, 24, 25, 57, 51, 42, 23, 86, 39, /* EX */ 48, 16, 66, 51, 36, 46, 47, 49, 24, 25, 56, 41, 44, 23, 61, 39, /* EX */
53, 54, 36, 34, 32, 62, 43,SYM, 44, 48, 27, 56, 46, 22, 87,SYM, /* FX */ 57, 53, 38, 32, 35, 55, 45,SYM, 42, 52, 26, 81, 43, 22, 68,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -110,18 +110,18 @@ static const unsigned char Ibm852_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 4X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 4X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 6X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 6X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,CTR, /* 7X */
50, 46, 25, 88, 38, 48, 47, 50, 49, 51, 62, 62, 89, 90, 38, 47, /* 8X */ 49, 43, 25, 66, 36, 52, 47, 49, 50, 41, 55, 55, 61, 82, 36, 47, /* 8X */
25, 41, 41, 32, 43, 33, 33, 91, 92, 43, 46, 31, 31, 49,SYM, 24, /* 9X */ 25, 46, 46, 35, 45, 31, 31, 58, 58, 45, 43, 33, 33, 50,SYM, 24, /* 9X */
19, 23, 34, 27, 93, 94, 26, 26, 57, 57,SYM, 95, 24, 59,SYM,SYM, /* AX */ 16, 23, 32, 26, 83, 84, 30, 30, 56, 56,SYM, 85, 24, 54,SYM,SYM, /* AX */
SYM,SYM,SYM,SYM,SYM, 19, 96, 42, 59,SYM,SYM,SYM,SYM, 61, 61,SYM, /* BX */ SYM,SYM,SYM,SYM,SYM, 16, 66, 44, 54,SYM,SYM,SYM,SYM, 63, 63,SYM, /* BX */
SYM,SYM,SYM,SYM,SYM,SYM, 55, 55,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* CX */ SYM,SYM,SYM,SYM,SYM,SYM, 51, 51,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* CX */
53, 53, 39, 51, 39, 36, 23, 97, 42,SYM,SYM,SYM,SYM, 98, 48,SYM, /* DX */ 57, 57, 39, 41, 39, 38, 23, 61, 44,SYM,SYM,SYM,SYM, 68, 52,SYM, /* DX */
34, 60, 32, 54, 54, 36, 29, 29, 45, 27, 45, 56, 22, 22, 99,SYM, /* EX */ 32, 59, 35, 53, 53, 38, 29, 29, 48, 26, 48, 86, 22, 22, 68,SYM, /* EX */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, 56, 44, 44,SYM,SYM, /* FX */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, 87, 42, 42,SYM,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -131,140 +131,148 @@ static const unsigned char Mac_Centraleurope_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 4X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 4X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 1, 20, 15, 11, 2, 28, 30, 17, 4, 18, 8, 10, 12, 3, 0, /* 6X */ SYM, 0, 19, 15, 12, 2, 28, 27, 17, 5, 18, 7, 9, 11, 3, 1, /* 6X */
13, 40, 6, 7, 5, 14, 9, 37, 35, 21, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */ 14, 40, 4, 6, 8, 13, 10, 34, 37, 21, 20,SYM,SYM,SYM,SYM,CTR, /* 7X */
38, 63, 63, 25,100, 43, 46, 19,101, 24, 38, 24, 47, 47, 25,102, /* 8X */ 36, 69, 69, 25, 88, 45, 43, 16, 89, 24, 36, 24, 47, 47, 25, 90, /* 8X */
103, 39, 23, 39,104,105,106, 34,107, 32, 43,108, 27, 42, 42, 46, /* 9X */ 91, 39, 23, 39, 67, 67, 92, 32, 93, 35, 45, 60, 26, 44, 44, 43, /* 9X */
SYM,SYM, 57,SYM,SYM,SYM,SYM, 60,SYM,SYM,SYM, 57,SYM,SYM,109,110, /* AX */ SYM,SYM, 56,SYM,SYM,SYM,SYM, 59,SYM,SYM,SYM, 56,SYM,SYM, 94, 95, /* AX */
111, 58,SYM,SYM, 58,112,SYM,SYM, 49,113,114, 33, 33, 41, 41,115, /* BX */ 96, 64,SYM,SYM, 64, 97,SYM,SYM, 50, 98, 99, 31, 31, 46, 46,100, /* BX */
116, 54,SYM,SYM, 54, 36,SYM,SYM,SYM,SYM,SYM, 36, 62,117, 62, 52, /* CX */ 101, 53,SYM,SYM, 53, 38,SYM,SYM,SYM,SYM,SYM, 38, 55, 60, 55, 62, /* CX */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, 52, 45, 45, 44,SYM,SYM, 44,118, /* DX */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, 62, 48, 48, 42,SYM,SYM, 42,102, /* DX */
119, 29,SYM,SYM, 29,120,121, 19, 31, 31, 23, 26, 26,122, 34, 32, /* EX */ 103, 29,SYM,SYM, 29, 58, 58, 16, 33, 33, 23, 30, 30, 65, 32, 35, /* EX */
123, 48, 27, 48, 56, 56,124,125, 22, 22,126, 61, 49, 61,127,SYM, /* FX */ 65, 52, 26, 52,104,105,106,107, 22, 22,108, 63, 50, 63,109,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
static const int Unicode_Char_size = 92; static const int Unicode_Char_size = 98;
static const unsigned int Unicode_CharOrder[] = static const unsigned int Unicode_CharOrder[] =
{ {
65, 1, 66, 20, 67, 15, 68, 11, 69, 2, 70, 28, 71, 30, 72, 17, 65, 0, 66, 19, 67, 15, 68, 12, 69, 2, 70, 28, 71, 27, 72, 17,
73, 4, 74, 18, 75, 8, 76, 10, 77, 12, 78, 3, 79, 0, 80, 13, 73, 5, 74, 18, 75, 7, 76, 9, 77, 11, 78, 3, 79, 1, 80, 14,
81, 40, 82, 6, 83, 7, 84, 5, 85, 14, 86, 9, 87, 37, 88, 35, 81, 40, 82, 4, 83, 6, 84, 8, 85, 13, 86, 10, 87, 34, 88, 37,
89, 21, 90, 16, 97, 1, 98, 20, 99, 15, 100, 11, 101, 2,102, 28, 89, 21, 90, 20, 97, 0, 98, 19, 99, 15, 100, 12, 101, 2,102, 28,
103, 30, 104, 17, 105, 4, 106, 18, 107, 8, 108, 10, 109, 12,110, 3, 103, 27, 104, 17, 105, 5, 106, 18, 107, 7, 108, 9, 109, 11,110, 3,
111, 0, 112, 13, 113, 40, 114, 6, 115, 7, 116, 5, 117, 14,118, 9, 111, 1, 112, 14, 113, 40, 114, 4, 115, 6, 116, 8, 117, 13,118, 10,
119, 37, 120, 35, 121, 21, 122, 16, 193, 19, 196, 38, 201, 25,205, 23, 119, 34, 120, 37, 121, 21, 122, 20, 193, 16, 196, 36, 201, 25,203, 41,
211, 34, 212, 32, 214, 43, 218, 27, 221, 22, 225, 19, 228, 38,233, 25, 205, 23, 211, 32, 212, 35, 214, 45, 218, 26, 220, 43, 221, 22,225, 16,
237, 23, 243, 34, 244, 32, 246, 43, 250, 27, 253, 22, 268, 24,269, 24, 228, 36, 233, 25, 235, 41, 237, 23, 243, 32, 244, 35, 246, 45,250, 26,
270, 39, 271, 39, 282, 42, 283, 42, 313, 41, 314, 41, 317, 33,318, 33, 252, 43, 253, 22, 262, 47, 263, 47, 268, 24, 269, 24, 270, 39,271, 39,
327, 36, 328, 36, 340, 45, 341, 45, 344, 44, 345, 44, 352, 29,353, 29, 282, 44, 283, 44, 313, 46, 314, 46, 317, 31, 318, 31, 327, 38,328, 38,
356, 31, 357, 31, 381, 26, 382, 26, 340, 48, 341, 48, 344, 42, 345, 42, 352, 29, 353, 29, 356, 33,357, 33,
381, 30, 382, 30,
}; };
/* Model Table: /* Model Table:
* Total sequences: 1198 * Total considered sequences: 1410 / 2401
* First 512 sequences: 0.9724967373205526 * - Positive sequences: first 773 (0.9950030300775062)
* Next 512 sequences (512-1024): 0.02707798928941092 * - Probable sequences: next 277 (1050-773) (0.003999347913144824)
* Rest: 0.00042527339003644096 * - Neutral sequences: last 1351 (0.0009976220093489419)
* - Negative sequences: 991 (off-ratio)
* Negative sequences: TODO * Negative sequences: TODO
*/ */
static const PRUint8 SlovakLangModel[] = static const PRUint8 SlovakLangModel[] =
{ {
2,2,2,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,2,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,3,3,3,3,3,0,2,
0,3,2,3,1,3,2,3,1,0,3,0,2,3,2,0,1,2,0,0,0,1,0, 3,0,3,3,3,3,3,3,1,3,3,0,0,3,3,3,2,1,2,0,0,0,0,0,0,
2,2,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,3,3,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,0,1,
0,3,0,3,0,3,3,3,3,0,2,1,3,2,2,0,2,2,0,0,0,2,0, 3,2,0,3,3,3,3,3,0,0,3,0,0,3,3,3,1,1,2,1,0,0,0,0,0,
3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,1,
2,3,0,3,2,3,3,3,2,0,3,3,3,3,2,0,3,2,0,0,1,0,0, 3,0,3,3,3,3,3,3,2,3,3,0,0,3,3,3,1,0,1,0,0,0,0,0,0,
3,3,3,3,3,3,2,3,3,2,2,3,2,2,3,3,2,2,2,3,2,3,3, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,3,3,3,3,
3,3,3,2,3,2,3,3,0,2,0,2,0,0,2,0,0,2,0,2,0,0,0, 3,3,3,3,3,3,3,0,3,0,3,1,1,1,0,1,1,2,0,1,3,1,0,0,0,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,
3,3,2,3,0,3,3,3,3,0,2,3,2,2,2,0,0,2,0,0,1,2,0, 3,3,3,3,3,3,3,0,3,2,2,3,0,2,2,0,2,2,0,2,0,2,0,0,0,
3,3,3,3,3,2,3,3,3,3,3,1,3,2,3,2,3,3,2,3,3,3,3, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,1,0,3,
3,2,3,0,3,2,2,2,1,0,2,3,0,2,1,2,2,1,1,2,2,0,2, 3,3,2,3,3,3,3,2,3,3,2,0,1,3,1,0,3,1,3,0,0,0,0,3,0,
3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,2,2,2,3,3,3,3, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,2,3,
3,3,3,2,2,2,2,3,2,2,0,3,2,2,2,2,0,2,0,0,2,0,0, 2,3,3,3,3,0,1,2,2,3,3,3,1,0,2,0,2,2,0,1,0,0,0,0,0,
3,3,3,3,3,3,2,3,3,3,3,2,3,3,3,3,2,2,2,3,2,3,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,1,3,3,2,1,1,2,3,3,3,
3,2,2,1,3,2,0,2,3,2,2,1,0,2,2,0,0,2,0,0,1,0,0, 2,3,3,1,2,0,1,3,3,0,2,3,1,0,3,0,0,2,2,1,0,2,1,0,0,
3,3,3,2,3,3,3,2,2,3,3,3,2,2,3,3,2,2,2,3,2,3,3, 3,3,3,3,3,3,3,3,3,3,3,3,2,3,1,3,3,3,1,3,3,3,3,3,
2,2,3,2,3,2,2,2,0,3,2,2,0,2,2,0,0,0,0,0,2,2,1, 2,3,3,2,2,2,0,0,3,1,2,1,1,1,2,2,0,2,2,1,2,1,1,0,1,
3,3,3,3,3,2,3,3,2,0,3,3,1,3,3,2,3,2,0,3,2,3,3, 3,3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,
3,2,3,2,2,1,3,2,0,2,0,0,0,2,0,3,2,0,2,2,1,2,2, 3,3,3,3,3,3,3,1,3,0,2,2,2,0,2,1,2,0,0,1,0,1,0,0,0,
3,3,3,3,3,3,2,3,3,2,3,2,2,2,3,2,2,2,2,3,2,3,3, 3,3,3,3,3,3,3,3,3,3,1,2,3,3,3,3,3,2,2,3,3,3,3,3,
3,2,3,2,3,2,2,3,0,1,0,3,0,2,0,0,0,0,0,0,0,0,0, 3,3,3,2,1,3,2,0,1,0,0,3,3,0,2,3,0,1,0,0,2,1,0,0,2,
3,3,3,3,3,2,3,3,3,3,3,2,3,3,3,3,3,2,2,3,2,3,3, 3,3,3,3,3,3,3,3,3,3,2,3,2,3,3,3,3,1,2,3,2,3,2,3,
3,2,2,2,2,2,2,2,0,3,3,2,2,2,2,0,0,0,2,2,0,2,0, 2,3,3,1,2,1,2,0,2,0,1,3,3,1,1,0,0,1,0,2,1,0,0,0,2,
3,3,3,3,3,3,2,3,2,0,2,2,3,3,3,2,0,0,2,3,3,3,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
3,1,2,2,2,0,0,1,0,3,0,2,1,1,0,3,0,1,0,0,1,0,2, 2,3,3,3,2,3,3,3,3,0,3,3,1,0,3,0,0,2,2,1,2,1,3,0,1,
3,3,3,3,3,3,3,2,2,0,3,2,2,2,3,2,1,2,0,3,2,2,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,3,3,3,0,1,
3,1,2,0,2,2,2,0,2,3,1,2,0,2,0,2,0,0,2,2,0,2,0, 3,1,0,3,3,3,3,2,1,2,2,0,0,3,1,3,2,1,1,0,0,0,0,0,0,
2,2,2,3,2,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,3,2,0, 3,3,3,3,3,3,3,3,3,3,0,1,2,3,3,3,3,3,1,2,0,3,1,3,
2,3,1,3,1,2,3,3,2,0,2,0,2,1,2,0,2,2,0,0,0,0,0, 2,3,3,0,2,3,0,1,1,2,0,3,3,0,2,0,0,2,0,1,0,1,2,0,0,
3,3,3,3,3,2,2,2,3,2,2,2,1,0,3,2,2,3,0,2,0,2,1, 3,3,3,3,3,3,3,3,3,3,2,1,2,3,1,3,2,3,1,2,3,3,0,3,
3,0,2,0,3,1,0,2,2,0,0,2,0,2,0,0,0,2,0,0,0,0,0, 0,3,3,2,2,0,0,0,1,2,0,0,0,0,1,0,3,1,0,0,0,0,0,0,0,
3,3,3,3,3,2,3,3,3,3,3,3,3,2,3,2,2,3,2,3,2,3,3, 0,1,1,3,3,1,3,3,3,3,3,3,3,2,3,3,0,3,3,3,3,0,0,0,
2,1,2,1,2,0,2,2,2,0,2,2,0,2,2,0,0,0,0,0,0,0,0, 3,0,0,2,1,3,3,3,0,1,0,0,0,0,2,1,0,0,2,0,0,0,0,0,0,
3,3,3,3,3,3,3,2,2,2,3,2,3,1,3,2,0,2,1,3,2,3,3, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,2,3,1,2,2,0,3,3,2,
2,1,2,0,2,1,2,0,0,0,2,1,0,2,2,1,0,0,2,0,2,1,2, 2,3,3,1,1,3,0,3,2,0,2,2,2,0,2,0,2,1,0,2,0,2,2,0,2,
3,3,3,3,3,3,2,3,2,3,2,2,3,2,3,2,2,2,2,2,2,0,0, 3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,2,3,3,2,3,3,1,0,3,
3,2,0,0,3,0,3,2,0,0,2,2,0,1,0,1,0,0,0,0,0,0,0, 3,1,3,0,1,3,2,1,2,1,0,0,1,0,1,0,0,2,0,2,0,1,0,0,0,
0,0,0,3,0,3,3,3,3,3,3,3,3,3,2,3,3,2,3,0,3,0,0, 3,3,3,3,3,3,3,3,2,3,2,3,3,3,1,3,3,2,3,3,2,3,3,3,
0,2,0,2,0,0,3,1,0,0,2,0,0,2,0,0,2,0,0,0,0,2,0, 3,3,2,2,0,2,1,2,1,0,2,1,0,0,1,0,0,1,2,1,1,1,1,0,0,
3,3,3,3,3,2,3,3,2,2,3,3,2,0,3,2,2,2,3,3,2,3,2, 3,3,3,3,3,3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
2,2,2,1,2,0,2,2,0,1,0,1,0,2,0,1,0,0,0,0,1,2,0, 2,3,3,1,0,3,0,2,3,3,2,0,0,0,2,0,0,1,0,1,0,0,0,0,0,
2,2,2,3,2,3,3,3,3,3,3,2,3,3,2,3,3,3,2,0,3,0,0, 3,3,3,3,3,2,3,3,3,3,3,3,3,3,3,3,1,3,3,3,3,1,0,0,
0,2,0,2,2,1,3,2,3,0,1,1,0,2,1,0,0,0,0,0,0,0,0, 3,0,2,2,2,3,3,2,0,3,1,0,0,0,3,0,1,0,0,0,0,2,0,0,0,
0,0,0,2,0,2,3,2,2,3,2,2,3,2,0,3,3,2,2,0,2,0,0, 0,0,0,3,3,0,3,3,3,2,3,3,2,0,2,3,0,2,1,3,3,0,0,0,
0,2,0,1,0,0,2,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0, 2,0,0,0,0,3,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,2,0,3,0,3,3,3,3,3,3,2,3,3,0,3,2,2,2,0,2,0,0, 1,2,0,3,3,1,3,3,3,3,3,3,3,0,3,3,0,3,3,3,3,0,0,0,
0,2,0,2,0,0,3,1,2,0,2,0,0,1,0,0,0,0,0,0,0,0,0, 3,0,0,2,1,3,3,2,0,3,0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,
3,3,3,3,3,3,2,2,3,0,3,0,2,0,2,2,0,0,0,2,0,0,0, 3,3,3,3,1,3,3,3,3,3,1,2,0,3,0,2,2,1,0,0,0,0,0,3,
3,0,1,1,1,0,3,0,0,0,0,2,0,2,0,0,0,0,0,0,0,0,0, 0,0,1,0,0,3,0,1,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,
2,0,2,2,0,3,3,2,2,2,2,2,3,2,0,3,3,3,0,0,1,0,0, 0,2,1,3,3,0,2,3,3,3,2,3,3,1,2,3,0,3,1,1,3,0,0,0,
0,2,0,0,0,2,2,2,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0, 2,0,0,2,2,2,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,
3,3,3,3,3,0,1,2,2,1,2,3,0,0,3,0,0,0,1,0,2,0,0, 1,2,0,3,3,0,3,3,3,3,3,3,3,0,3,3,0,3,1,3,3,0,0,0,
3,0,2,0,0,0,2,0,0,0,0,0,0,2,0,0,2,0,0,0,0,0,0, 3,0,0,0,2,3,3,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
1,0,0,3,0,3,3,3,2,3,3,3,2,3,0,3,3,2,0,0,2,0,0, 3,3,3,3,3,3,3,2,3,3,2,2,2,3,0,0,3,3,2,2,0,3,0,1,
0,3,0,2,0,2,2,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,2,2,3,1,0,0,1,3,0,2,0,0,0,0,0,0,1,0,2,0,2,0,0,0,
3,3,3,2,3,2,3,1,2,1,2,0,2,0,3,0,0,1,0,2,0,3,0, 3,3,3,2,3,3,2,3,3,3,1,2,1,3,2,1,3,0,1,1,0,3,1,3,
2,0,2,0,1,2,1,2,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0, 1,3,1,2,3,1,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
3,3,3,3,3,3,0,2,2,2,3,1,2,3,2,0,0,2,0,1,2,0,0, 3,3,3,3,2,3,3,3,3,3,3,2,0,3,3,0,2,2,0,1,0,0,0,3,
3,2,1,0,1,0,2,0,2,0,2,0,0,1,0,0,0,0,0,0,0,0,0, 2,2,1,0,0,3,0,2,1,3,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,
3,3,3,2,3,2,3,2,0,2,3,2,2,1,3,1,0,2,1,2,0,2,0, 3,3,3,3,1,3,3,3,0,1,0,2,3,3,0,0,2,0,1,3,0,0,0,3,
0,0,2,0,2,0,0,2,0,0,0,2,0,0,1,0,0,0,0,0,2,0,0, 0,2,1,0,0,3,0,0,0,0,0,0,0,0,2,2,0,0,0,0,0,0,0,0,0,
3,3,0,0,1,0,2,0,1,0,0,2,0,1,2,0,0,0,0,2,0,0,0, 3,3,2,3,1,0,3,3,2,0,2,3,1,3,0,1,0,1,1,3,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 1,0,3,2,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,2,3,3,3,3,3,2,1,0,0,2,2,0,0,0,2,0,0, 0,0,0,3,3,1,2,1,3,2,1,3,3,0,3,2,0,1,2,3,3,0,0,0,
0,0,0,3,0,0,1,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,3,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
3,3,0,3,0,0,0,2,3,2,0,0,2,0,3,0,1,1,0,0,2,0,0, 3,3,0,1,2,2,0,1,1,0,0,1,2,2,0,0,1,1,0,1,0,0,0,0,
0,2,0,0,2,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,3,0,2,3,2,1,1,2,3,3,3,0,1,2,0,0,0,3,0,0, 3,3,3,2,3,3,3,1,2,2,0,1,1,1,0,1,0,2,0,1,0,2,0,1,
0,0,0,1,0,1,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,1,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,2,0,0,0,0,0,
2,2,2,2,3,3,0,0,1,0,2,0,2,2,2,0,0,1,0,0,0,1,0, 0,0,0,0,3,0,3,2,2,3,3,2,3,0,1,2,0,1,2,3,3,0,0,0,
1,0,0,0,0,2,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0, 1,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
3,3,0,0,0,0,0,0,0,0,0,1,2,0,2,0,0,2,0,2,0,0,0, 0,1,0,2,2,1,2,2,3,0,1,0,2,0,0,1,0,1,0,1,3,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 3,0,0,1,0,0,0,0,0,3,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,
2,2,2,1,3,2,0,2,1,0,2,0,1,0,0,0,0,2,0,0,1,1,0, 3,2,3,2,0,3,0,2,3,0,2,1,0,2,3,0,0,0,0,0,0,2,0,1,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0, 0,0,0,0,2,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,2,0,2,1,0,1,0,0,2,0,0,0,2,2,0,0,0,2,0,0, 3,3,0,0,0,0,1,0,0,0,0,2,1,3,0,0,2,0,0,0,0,0,0,0,
0,3,0,0,0,0,0,2,2,0,0,0,0,0,0,2,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
2,3,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0, 3,3,0,0,0,0,2,0,0,0,0,2,0,3,0,0,1,0,0,0,0,0,0,0,
0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,2,0,0,1,0,0,0,0,2,0,0,0,0,2,0,0,0, 1,0,2,0,0,2,0,0,0,0,1,0,0,3,0,0,0,0,0,1,0,1,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,2,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,2,0,0, 0,0,0,1,2,0,2,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,2,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,2,0,2,2,0,2,0,2,0,1,0,0,1,2,0,2,0,0,0,0, 0,1,2,0,0,2,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,3,
0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,2,0,2,2,2,0,0,2,2,2,0,0,0,0,2,0,0,1,0,0, 0,0,2,2,2,1,1,1,2,2,0,0,1,0,0,2,0,1,0,2,1,0,0,0,
0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,
0,0,2,0,2,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0, 0,0,0,1,2,0,1,3,2,1,0,1,1,0,2,2,0,1,1,0,1,0,0,0,
2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,
0,0,0,0,0,2,0,0,0,0,0,0,1,0,0,0,0,2,0,0,0,0,0, 0,0,0,2,2,0,1,1,2,1,0,2,0,0,1,1,0,1,0,1,0,0,0,0,
0,0,0,0,0,0,2,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0, 0,0,0,1,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,2,0,0,0,0,
0,0,0,0,0,0,3,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,
2,2,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,1,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,
0,0,0,0,0,2,1,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,
}; };
@ -272,8 +280,8 @@ const SequenceModel Iso_8859_2SlovakModel =
{ {
Iso_8859_2_CharToOrderMap, Iso_8859_2_CharToOrderMap,
SlovakLangModel, SlovakLangModel,
46, 49,
(float)0.9724967373205526, (float)0.9990023779906511,
PR_TRUE, PR_TRUE,
"ISO-8859-2", "ISO-8859-2",
"sk" "sk"
@ -283,8 +291,8 @@ const SequenceModel Windows_1250SlovakModel =
{ {
Windows_1250_CharToOrderMap, Windows_1250_CharToOrderMap,
SlovakLangModel, SlovakLangModel,
46, 49,
(float)0.9724967373205526, (float)0.9990023779906511,
PR_TRUE, PR_TRUE,
"WINDOWS-1250", "WINDOWS-1250",
"sk" "sk"
@ -294,8 +302,8 @@ const SequenceModel Ibm852SlovakModel =
{ {
Ibm852_CharToOrderMap, Ibm852_CharToOrderMap,
SlovakLangModel, SlovakLangModel,
46, 49,
(float)0.9724967373205526, (float)0.9990023779906511,
PR_TRUE, PR_TRUE,
"IBM852", "IBM852",
"sk" "sk"
@ -305,8 +313,8 @@ const SequenceModel Mac_CentraleuropeSlovakModel =
{ {
Mac_Centraleurope_CharToOrderMap, Mac_Centraleurope_CharToOrderMap,
SlovakLangModel, SlovakLangModel,
46, 49,
(float)0.9724967373205526, (float)0.9990023779906511,
PR_TRUE, PR_TRUE,
"MAC-CENTRALEUROPE", "MAC-CENTRALEUROPE",
"sk" "sk"
@ -316,8 +324,8 @@ const LanguageModel SlovakModel =
{ {
"sk", "sk",
Unicode_CharOrder, Unicode_CharOrder,
92, 98,
SlovakLangModel, SlovakLangModel,
46, 49,
(float)0.9724967373205526, (float)0.9998118217433309,
}; };

View File

@ -42,7 +42,7 @@
/** /**
* Generated by BuildLangModel.py * Generated by BuildLangModel.py
* On: 2021-03-16 20:20:05.416974 * On: 2021-03-21 12:38:56.631590
**/ **/
/* Character Mapping Table: /* Character Mapping Table:
@ -68,18 +68,18 @@ static const unsigned char Iso_8859_2_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 4X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 4X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,SYM, /* 5X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 6X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 6X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,CTR, /* 7X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */
SYM, 41,SYM, 42,SYM, 43, 44,SYM,SYM, 22, 45, 46, 47,SYM, 23, 48, /* AX */ SYM, 57,SYM, 48,SYM, 58, 59,SYM,SYM, 22, 60, 61, 62,SYM, 23, 63, /* AX */
SYM, 49,SYM, 50,SYM, 51, 52,SYM,SYM, 22, 53, 54, 55,SYM, 23, 56, /* BX */ SYM, 64,SYM, 48,SYM, 65, 66,SYM,SYM, 22, 67, 68, 69,SYM, 23, 70, /* BX */
57, 33, 58, 59, 60, 61, 62, 31, 21, 29, 63, 37, 64, 30, 65, 66, /* CX */ 71, 34, 72, 73, 33, 74, 30, 45, 20, 29, 75, 46, 76, 37, 51, 77, /* CX */
67, 68, 69, 32, 36, 70, 71,SYM, 72, 73, 39, 74, 75, 40, 76, 77, /* DX */ 35, 53, 78, 36, 49, 79, 31,SYM, 41, 80, 81, 82, 28, 43, 83, 44, /* DX */
78, 33, 79, 80, 81, 82, 83, 31, 21, 29, 84, 37, 85, 30, 86, 87, /* EX */ 84, 34, 85, 86, 33, 87, 30, 45, 20, 29, 88, 46, 89, 37, 51, 90, /* EX */
88, 89, 90, 32, 36, 91, 92,SYM, 93, 94, 39, 95, 96, 40, 97,SYM, /* FX */ 35, 53, 91, 36, 49, 92, 31,SYM, 41, 93, 94, 95, 28, 43, 96,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -89,18 +89,18 @@ static const unsigned char Iso_8859_16_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 4X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 4X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,SYM, /* 5X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 6X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 6X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,CTR, /* 7X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 8X */
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 9X */
SYM, 98, 99,100,SYM,SYM, 22,SYM, 22,SYM,101,SYM,102,SYM,103,104, /* AX */ SYM, 97, 98, 48,SYM,SYM, 22,SYM, 22,SYM, 99,SYM,100,SYM,101,102, /* AX */
SYM,SYM, 21,105, 23,SYM,SYM,SYM, 23, 21,106,SYM,107,108,109,110, /* BX */ SYM,SYM, 20, 48, 23,SYM,SYM,SYM, 23, 20,103,SYM, 52, 52,104,105, /* BX */
111, 33,112,113,114,115,116, 31, 35, 29, 34, 37,117, 30,118,119, /* CX */ 39, 34,106,107, 33, 30, 47, 45, 38, 29,108, 46, 50, 37, 51,109, /* CX */
120,121,122, 32, 36,123,124,125,126,127, 39,128,129,130,131,132, /* DX */ 35, 53, 56, 36, 49,110, 31,111,112, 54,113, 55, 28,114,115, 44, /* DX */
133, 33,134,135,136,137,138, 31, 35, 29, 34, 37,139, 30,140,141, /* EX */ 39, 34,116,117, 33, 30, 47, 45, 38, 29,118, 46, 50, 37, 51,119, /* EX */
142,143,144, 32, 36,145,146,147,148,149, 39,150,151,152,153,154, /* FX */ 35, 53, 56, 36, 49,120, 31,121,122, 54,123, 55, 28,124,125,126, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -110,18 +110,18 @@ static const unsigned char Windows_1250_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 4X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 4X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,SYM, /* 5X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 6X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 6X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,CTR, /* 7X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */
SYM,ILL,SYM,ILL,SYM,SYM,SYM,SYM,ILL,SYM, 22,SYM,155,156, 23,157, /* 8X */ SYM,ILL,SYM,ILL,SYM,SYM,SYM,SYM,ILL,SYM, 22,SYM,127,128, 23,129, /* 8X */
ILL,SYM,SYM,SYM,SYM,SYM,SYM,SYM,ILL,SYM, 22,SYM,158,159, 23,160, /* 9X */ ILL,SYM,SYM,SYM,SYM,SYM,SYM,SYM,ILL,SYM, 22,SYM,130,131, 23,132, /* 9X */
SYM,SYM,SYM,161,SYM,162,SYM,SYM,SYM,SYM,163,SYM,SYM,SYM,SYM,164, /* AX */ SYM,SYM,SYM, 48,SYM,133,SYM,SYM,SYM,SYM,134,SYM,SYM,SYM,SYM,135, /* AX */
SYM,SYM,SYM,165,SYM,SYM,SYM,SYM,SYM,166,167,SYM,168,SYM,169,170, /* BX */ SYM,SYM,SYM, 48,SYM,SYM,SYM,SYM,SYM,136,137,SYM,138,SYM,139,140, /* BX */
171, 33,172,173,174,175,176, 31, 21, 29,177, 37,178, 30,179,180, /* CX */ 141, 34,142,143, 33,144, 30, 45, 20, 29,145, 46,146, 37, 51,147, /* CX */
181,182,183, 32, 36,184,185,SYM,186,187, 39,188,189, 40,190,191, /* DX */ 35, 53,148, 36, 49,149, 31,SYM, 41,150,151,152, 28, 43,153, 44, /* DX */
192, 33,193,194,195,196,197, 31, 21, 29,198, 37,199, 30,200,201, /* EX */ 154, 34,155,156, 33,157, 30, 45, 20, 29,158, 46,159, 37, 51,160, /* EX */
202,203,204, 32, 36,205,206,SYM,207,208, 39,209,210, 40,211,SYM, /* FX */ 35, 53,161, 36, 49,162, 31,SYM, 41,163,164,165, 28, 43,166,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -131,18 +131,18 @@ static const unsigned char Ibm852_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 4X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 4X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,SYM, /* 5X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 6X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 6X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,CTR, /* 7X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */
31,212, 29,213,214,215,216, 31,217, 37,218,219,220,221,222,223, /* 8X */ 45, 28, 29,167, 33,168, 30, 45, 48, 46,169,170, 51,171, 33, 30, /* 8X */
29,224,225, 36,226,227,228,229,230,231,232,233,234,235,SYM, 21, /* 9X */ 29,172,173, 49, 31,174,175,176,177, 31, 28,178,179, 48,SYM, 20, /* 9X */
33, 30, 32, 39,236,237, 23, 23,238,239,SYM,240, 21,241,SYM,SYM, /* AX */ 34, 37, 36,180,181,182, 23, 23,183,184,SYM,185, 20,186,SYM,SYM, /* AX */
SYM,SYM,SYM,SYM,SYM, 33,242,243,244,SYM,SYM,SYM,SYM,245,246,SYM, /* BX */ SYM,SYM,SYM,SYM,SYM, 34,187,188,189,SYM,SYM,SYM,SYM,190,191,SYM, /* BX */
SYM,SYM,SYM,SYM,SYM,SYM,247,248,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* CX */ SYM,SYM,SYM,SYM,SYM,SYM,192,193,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* CX */
249,249,249, 37,249,249, 30,249,249,SYM,SYM,SYM,SYM,249,249,SYM, /* DX */ 35, 35,194, 46,195,196, 37, 51,197,SYM,SYM,SYM,SYM,198,199,SYM, /* DX */
32,249, 36,249,249,249, 22, 22,249, 39,249,249, 40, 40,249,SYM, /* EX */ 36, 44, 49, 53, 53,200, 22, 22,201,202,203,204, 43, 43,205,SYM, /* EX */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,249,249,249,SYM,SYM, /* FX */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,206, 41, 41,SYM,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
@ -152,73 +152,69 @@ static const unsigned char Mac_Centraleurope_CharToOrderMap[] =
CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */ CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR,CTR, /* 1X */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM, /* 2X */
NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */ NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,NUM,SYM,SYM,SYM,SYM,SYM,SYM, /* 3X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 4X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 4X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,SYM, /* 5X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,SYM, /* 5X */
SYM, 0, 18, 19, 13, 1, 24, 17, 20, 2, 9, 12, 8, 14, 4, 3, /* 6X */ SYM, 1, 17, 21, 12, 0, 24, 18, 19, 2, 9, 11, 7, 14, 4, 3, /* 6X */
11, 28, 5, 6, 7, 16, 10, 25, 27, 26, 15,SYM,SYM,SYM,SYM,CTR, /* 7X */ 13, 32, 5, 6, 8, 15, 10, 25, 27, 26, 16,SYM,SYM,SYM,SYM,CTR, /* 7X */
249,249,249, 29,249,249,249, 33,249, 21,249, 21,249,249, 29,249, /* 8X */ 33, 42, 42, 29,207, 31, 28, 34,208, 20, 33, 20, 30, 30, 29,209, /* 8X */
249,249, 30,249, 38, 38,249, 32,249, 36,249,249, 39,249,249,249, /* 9X */ 210,211, 37,212, 40, 40,213, 36,214, 49, 31,215,216,217,218, 28, /* 9X */
SYM,SYM,249,SYM,SYM,SYM,SYM,249,SYM,SYM,SYM,249,SYM,SYM,249,249, /* AX */ SYM,SYM,219,SYM,SYM,SYM,SYM, 44,SYM,SYM,SYM,220,SYM,SYM,221,222, /* AX */
249,249,SYM,SYM,249,249,SYM,SYM,249,249,249,249,249,249,249,249, /* BX */ 223,224,SYM,SYM,225,226,SYM,SYM, 48,227,228,229,230,231,232,233, /* BX */
249,249,SYM,SYM,249,249,SYM,SYM,SYM,SYM,SYM,249,249,249,249,249, /* CX */ 234, 53,SYM,SYM, 53,235,SYM,SYM,SYM,SYM,SYM,236,237,238,239,240, /* CX */
SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,249,249,249,249,SYM,SYM,249,249, /* DX */ SYM,SYM,SYM,SYM,SYM,SYM,SYM,SYM,241,242,243, 41,SYM,SYM, 41,244, /* DX */
249, 22,SYM,SYM, 22,249,249, 33,249,249, 30, 23, 23,249, 32, 36, /* EX */ 245, 22,SYM,SYM, 22,246,247, 34,248,249, 37, 23, 23,249, 36, 49, /* EX */
249,249, 39,249,249,249,249,249, 40, 40,249,249,249,249,249,SYM, /* FX */ 249,249,249,249,249,249,249,249, 43, 43,249,249, 48,249,249,SYM, /* FX */
}; };
/*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */ /*X0 X1 X2 X3 X4 X5 X6 X7 X8 X9 XA XB XC XD XE XF */
static const int Unicode_Char_size = 58; static const int Unicode_Char_size = 50;
static const unsigned int Unicode_CharOrder[] = static const unsigned int Unicode_CharOrder[] =
{ {
65, 0, 66, 18, 67, 19, 68, 13, 69, 1, 70, 24, 71, 17, 72, 20, 65, 1, 66, 17, 67, 21, 68, 12, 69, 0, 70, 24, 71, 18, 72, 19,
73, 2, 74, 9, 75, 12, 76, 8, 77, 14, 78, 4, 79, 3, 80, 11, 73, 2, 74, 9, 75, 11, 76, 7, 77, 14, 78, 4, 79, 3, 80, 13,
81, 28, 82, 5, 83, 6, 84, 7, 85, 16, 86, 10, 87, 25, 88, 27, 82, 5, 83, 6, 84, 8, 85, 15, 86, 10, 90, 16, 97, 1, 98, 17,
89, 26, 90, 15, 97, 0, 98, 18, 99, 19, 100, 13, 101, 1,102, 24, 99, 21, 100, 12, 101, 0, 102, 24, 103, 18, 104, 19, 105, 2,106, 9,
103, 17, 104, 20, 105, 2, 106, 9, 107, 12, 108, 8, 109, 14,110, 4, 107, 11, 108, 7, 109, 14, 110, 4, 111, 3, 112, 13, 114, 5,115, 6,
111, 3, 112, 11, 113, 28, 114, 5, 115, 6, 116, 7, 117, 16,118, 10, 116, 8, 117, 15, 118, 10, 122, 16, 268, 20, 269, 20, 352, 22,353, 22,
119, 25, 120, 27, 121, 26, 122, 15, 268, 21, 269, 21, 352, 22,353, 22,
381, 23, 382, 23, 381, 23, 382, 23,
}; };
/* Model Table: /* Model Table:
* Total sequences: 698 * Total considered sequences: 880 / 625
* First 512 sequences: 0.998296272473889 * - Positive sequences: first 449 (0.9950499684040537)
* Next 512 sequences (512-1024): 0.00170372752611106 * - Probable sequences: next 172 (621-449) (0.003957684836286113)
* Rest: -2.8189256484623115e-17 * - Neutral sequences: last 4 (0.000992346759660201)
* - Negative sequences: -255 (off-ratio)
* Negative sequences: TODO * Negative sequences: TODO
*/ */
static const PRUint8 SloveneLangModel[] = static const PRUint8 SloveneLangModel[] =
{ {
2,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2, 3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0,0,3,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,2,3,2,0, 3,3,3,3,3,2,3,2,3,3,3,3,3,3,2,3,3,3,3,3,3,3,3,2,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,0,2, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,
3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,2,3,2,3,3,3,2,2,0,3,3,3,2,2, 3,3,3,3,3,3,3,3,3,2,3,3,1,3,3,3,2,3,2,3,2,3,1,1,2,
3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,3,2,3,3,3,0,2,0,3,3,3,3,0, 3,3,3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,2,3,3,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,2,3,0,3,3,2,3,0,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,3,3,2,2,3,0,3,0,0,1,
3,3,3,3,3,2,3,3,0,0,3,3,3,3,3,3,3,2,3,3,3,2,3,0,0,0,0,0,0, 3,3,3,3,3,3,3,2,3,1,3,3,3,3,3,3,2,3,1,3,2,3,3,0,1,
3,3,3,3,3,3,3,3,3,3,0,3,3,3,3,3,3,3,2,3,3,3,3,2,2,0,2,2,0, 3,3,3,3,3,3,3,3,3,3,0,3,3,3,2,3,3,3,3,2,3,3,3,2,0,
3,3,3,3,3,3,3,3,3,0,0,3,3,3,3,0,3,3,2,3,3,2,2,0,0,0,3,2,0, 3,3,3,3,3,3,3,3,3,3,3,2,3,2,3,3,0,1,1,2,0,3,2,0,2,
3,3,3,3,3,3,3,3,3,3,3,2,0,2,3,0,3,2,2,3,3,0,3,0,0,2,3,0,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,2,3,3,3,2,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,2,2,2,3,2,0, 3,3,3,3,3,3,3,3,3,2,1,2,1,2,1,3,2,1,1,3,2,2,2,0,2,
3,3,3,3,3,3,3,3,3,3,2,3,3,3,3,0,3,2,3,3,3,2,2,0,2,3,3,2,0, 3,3,3,3,3,3,3,3,2,1,3,3,2,3,3,3,1,3,1,1,3,3,3,1,2,
3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,2,3,2,3,2,0,0,2,2,0, 3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,1,3,3,3,3,3,3,3,3,2,
3,3,3,2,3,3,3,3,3,3,3,3,3,3,3,3,0,3,3,3,3,3,3,3,3,0,2,3,0, 3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,1,2,3,1,1,
3,3,3,3,3,3,3,2,3,0,3,3,0,0,2,2,3,3,3,2,3,0,0,0,0,0,2,2,0, 3,3,3,3,3,3,3,3,3,3,3,2,3,1,3,3,3,2,2,1,3,2,2,0,0,
3,3,3,3,3,3,3,3,3,3,3,2,2,3,3,0,3,0,3,3,0,3,2,2,2,0,3,0,0, 3,3,3,3,3,3,2,3,2,1,2,2,2,1,2,3,0,2,2,3,0,1,0,0,0,
3,3,3,3,2,3,3,3,3,0,2,3,3,3,2,2,3,2,3,3,3,0,0,0,2,2,2,2,2, 3,3,3,3,3,3,2,3,3,0,1,3,2,1,3,3,0,2,2,0,2,0,0,0,2,
3,3,3,3,3,3,2,3,3,0,3,2,3,3,2,3,3,0,2,0,0,2,0,0,2,2,2,0,0, 3,3,3,3,3,3,1,3,1,3,3,3,0,0,1,3,0,2,0,0,0,1,0,0,0,
3,3,3,3,3,3,0,2,3,3,2,2,3,2,0,0,3,0,2,2,0,0,0,0,0,0,0,0,0, 3,3,3,3,2,3,2,3,3,1,3,3,1,0,2,3,1,1,1,3,0,3,0,0,2,
3,3,3,3,3,2,0,3,3,3,2,3,3,0,0,0,3,0,0,0,0,3,0,0,0,0,0,0,0, 3,3,3,3,3,2,0,3,3,3,3,3,1,3,2,3,0,0,0,0,3,2,1,0,0,
3,3,3,2,3,2,0,0,2,3,2,0,3,0,0,0,2,2,3,0,0,0,0,0,0,0,0,0,0, 3,3,3,3,3,2,0,0,0,3,1,2,0,0,1,3,0,3,2,0,0,1,0,0,0,
3,3,3,3,2,3,3,3,3,2,0,0,0,0,2,0,3,2,0,0,0,0,0,0,3,2,0,0,0, 3,3,3,3,2,3,3,3,2,2,0,1,0,0,2,3,0,2,2,0,0,0,0,0,3,
3,3,3,3,3,0,3,2,2,0,0,0,0,2,0,0,2,2,2,0,2,0,0,0,0,3,2,0,0,
2,3,2,3,3,2,3,2,3,3,0,2,2,2,3,0,2,2,2,3,2,0,0,0,0,2,0,0,0,
3,2,3,3,0,2,2,3,0,0,2,3,0,2,2,0,3,2,3,3,0,0,0,0,0,2,2,3,0,
0,0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,
}; };
@ -226,9 +222,9 @@ const SequenceModel Iso_8859_2SloveneModel =
{ {
Iso_8859_2_CharToOrderMap, Iso_8859_2_CharToOrderMap,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9990076532403398,
PR_TRUE, PR_FALSE,
"ISO-8859-2", "ISO-8859-2",
"sl" "sl"
}; };
@ -237,9 +233,9 @@ const SequenceModel Iso_8859_16SloveneModel =
{ {
Iso_8859_16_CharToOrderMap, Iso_8859_16_CharToOrderMap,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9990076532403398,
PR_TRUE, PR_FALSE,
"ISO-8859-16", "ISO-8859-16",
"sl" "sl"
}; };
@ -248,9 +244,9 @@ const SequenceModel Windows_1250SloveneModel =
{ {
Windows_1250_CharToOrderMap, Windows_1250_CharToOrderMap,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9990076532403398,
PR_TRUE, PR_FALSE,
"WINDOWS-1250", "WINDOWS-1250",
"sl" "sl"
}; };
@ -259,9 +255,9 @@ const SequenceModel Ibm852SloveneModel =
{ {
Ibm852_CharToOrderMap, Ibm852_CharToOrderMap,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9990076532403398,
PR_TRUE, PR_FALSE,
"IBM852", "IBM852",
"sl" "sl"
}; };
@ -270,9 +266,9 @@ const SequenceModel Mac_CentraleuropeSloveneModel =
{ {
Mac_Centraleurope_CharToOrderMap, Mac_Centraleurope_CharToOrderMap,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9990076532403398,
PR_TRUE, PR_FALSE,
"MAC-CENTRALEUROPE", "MAC-CENTRALEUROPE",
"sl" "sl"
}; };
@ -281,8 +277,8 @@ const LanguageModel SloveneModel =
{ {
"sl", "sl",
Unicode_CharOrder, Unicode_CharOrder,
58, 50,
SloveneLangModel, SloveneLangModel,
29, 25,
(float)0.998296272473889, (float)0.9976974938105708,
}; };