cchardet 0.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.gitignore +8 -0
- data/.gitmodules +3 -0
- data/.rubocop.yml +11 -0
- data/CHANGELOG.md +5 -0
- data/Gemfile +10 -0
- data/README.md +35 -0
- data/Rakefile +15 -0
- data/cchardet.gemspec +30 -0
- data/ext/cchardet/extconf.rb +26 -0
- data/ext/uchardet/.gitignore +1 -0
- data/ext/uchardet/.gitlab-ci.yml +106 -0
- data/ext/uchardet/AUTHORS +16 -0
- data/ext/uchardet/CMakeLists.txt +74 -0
- data/ext/uchardet/COPYING +1316 -0
- data/ext/uchardet/INSTALL +26 -0
- data/ext/uchardet/README.md +295 -0
- data/ext/uchardet/build-mac/uchardet.cpp +7 -0
- data/ext/uchardet/build-mac/uchardet.xcodeproj/project.pbxproj +543 -0
- data/ext/uchardet/build-mac/uchardet.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -0
- data/ext/uchardet/build-mac/uchardet.xcodeproj/project.xcworkspace/xcshareddata/uchardet.xccheckout +41 -0
- data/ext/uchardet/build-mac/uchardet.xcodeproj/xcshareddata/xcschemes/uchardet-ios.xcscheme +77 -0
- data/ext/uchardet/build-mac/uchardet.xcodeproj/xcshareddata/xcschemes/uchardet.xcscheme +77 -0
- data/ext/uchardet/doc/CMakeLists.txt +6 -0
- data/ext/uchardet/doc/README.maintainer +59 -0
- data/ext/uchardet/doc/uchardet.1 +18 -0
- data/ext/uchardet/script/BuildLangModel.py +533 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangArabicModel.log +142 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangCroatianModel.log +157 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangCzechModel.log +161 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangDanishModel.log +158 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangEsperantoModel.log +110 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangEstonianModel.log +159 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangFinnishModel.log +156 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangFrenchModel.log +116 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangGermanModel.log +159 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangGreekModel.log +272 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangHungarianModel.log +109 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangIrishModel.log +156 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangItalianModel.log +162 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangLatvianModel.log +162 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangLithuanianModel.log +162 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangMalteseModel.log +147 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangPolishModel.log +154 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangPortugueseModel.log +166 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangRomanianModel.log +153 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangSlovakModel.log +158 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangSloveneModel.log +148 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangSpanishModel.log +109 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangSwedishModel.log +151 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangThaiModel.log +141 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangTurkishModel.log +113 -0
- data/ext/uchardet/script/BuildLangModelLogs/LangVietnameseModel.log +121 -0
- data/ext/uchardet/script/README +63 -0
- data/ext/uchardet/script/charsets/codepoints.py +53 -0
- data/ext/uchardet/script/charsets/db.py +73 -0
- data/ext/uchardet/script/charsets/ibm852.py +72 -0
- data/ext/uchardet/script/charsets/iso-8859-1.py +85 -0
- data/ext/uchardet/script/charsets/iso-8859-10.py +73 -0
- data/ext/uchardet/script/charsets/iso-8859-11.py +77 -0
- data/ext/uchardet/script/charsets/iso-8859-13.py +72 -0
- data/ext/uchardet/script/charsets/iso-8859-15.py +80 -0
- data/ext/uchardet/script/charsets/iso-8859-16.py +83 -0
- data/ext/uchardet/script/charsets/iso-8859-2.py +73 -0
- data/ext/uchardet/script/charsets/iso-8859-3.py +75 -0
- data/ext/uchardet/script/charsets/iso-8859-4.py +73 -0
- data/ext/uchardet/script/charsets/iso-8859-6.py +73 -0
- data/ext/uchardet/script/charsets/iso-8859-7.py +73 -0
- data/ext/uchardet/script/charsets/iso-8859-9.py +76 -0
- data/ext/uchardet/script/charsets/mac-centraleurope.py +72 -0
- data/ext/uchardet/script/charsets/tis-620.py +77 -0
- data/ext/uchardet/script/charsets/viscii.py +72 -0
- data/ext/uchardet/script/charsets/windows-1250.py +75 -0
- data/ext/uchardet/script/charsets/windows-1252.py +76 -0
- data/ext/uchardet/script/charsets/windows-1253.py +72 -0
- data/ext/uchardet/script/charsets/windows-1256.py +75 -0
- data/ext/uchardet/script/charsets/windows-1257.py +72 -0
- data/ext/uchardet/script/charsets/windows-1258.py +72 -0
- data/ext/uchardet/script/debug.sh +9 -0
- data/ext/uchardet/script/header-template.cpp +38 -0
- data/ext/uchardet/script/langs/ar.py +59 -0
- data/ext/uchardet/script/langs/cs.py +80 -0
- data/ext/uchardet/script/langs/da.py +69 -0
- data/ext/uchardet/script/langs/de.py +69 -0
- data/ext/uchardet/script/langs/el.py +55 -0
- data/ext/uchardet/script/langs/eo.py +67 -0
- data/ext/uchardet/script/langs/es.py +69 -0
- data/ext/uchardet/script/langs/et.py +57 -0
- data/ext/uchardet/script/langs/fi.py +60 -0
- data/ext/uchardet/script/langs/fr.py +79 -0
- data/ext/uchardet/script/langs/ga.py +60 -0
- data/ext/uchardet/script/langs/hr.py +59 -0
- data/ext/uchardet/script/langs/hu.py +66 -0
- data/ext/uchardet/script/langs/it.py +56 -0
- data/ext/uchardet/script/langs/lt.py +70 -0
- data/ext/uchardet/script/langs/lv.py +69 -0
- data/ext/uchardet/script/langs/mt.py +80 -0
- data/ext/uchardet/script/langs/pl.py +81 -0
- data/ext/uchardet/script/langs/pt.py +80 -0
- data/ext/uchardet/script/langs/ro.py +65 -0
- data/ext/uchardet/script/langs/sk.py +80 -0
- data/ext/uchardet/script/langs/sl.py +59 -0
- data/ext/uchardet/script/langs/sv.py +56 -0
- data/ext/uchardet/script/langs/th.py +55 -0
- data/ext/uchardet/script/langs/tr.py +67 -0
- data/ext/uchardet/script/langs/vi.py +64 -0
- data/ext/uchardet/script/release.sh +8 -0
- data/ext/uchardet/script/win32.sh +7 -0
- data/ext/uchardet/src/Big5Freq.tab +943 -0
- data/ext/uchardet/src/CMakeLists.txt +160 -0
- data/ext/uchardet/src/CharDistribution.cpp +109 -0
- data/ext/uchardet/src/CharDistribution.h +242 -0
- data/ext/uchardet/src/EUCKRFreq.tab +614 -0
- data/ext/uchardet/src/EUCTWFreq.tab +447 -0
- data/ext/uchardet/src/GB2312Freq.tab +491 -0
- data/ext/uchardet/src/JISFreq.tab +589 -0
- data/ext/uchardet/src/JpCntx.cpp +230 -0
- data/ext/uchardet/src/JpCntx.h +140 -0
- data/ext/uchardet/src/LangModels/LangArabicModel.cpp +267 -0
- data/ext/uchardet/src/LangModels/LangBulgarianModel.cpp +249 -0
- data/ext/uchardet/src/LangModels/LangCroatianModel.cpp +298 -0
- data/ext/uchardet/src/LangModels/LangCzechModel.cpp +285 -0
- data/ext/uchardet/src/LangModels/LangDanishModel.cpp +201 -0
- data/ext/uchardet/src/LangModels/LangEsperantoModel.cpp +142 -0
- data/ext/uchardet/src/LangModels/LangEstonianModel.cpp +268 -0
- data/ext/uchardet/src/LangModels/LangFinnishModel.cpp +297 -0
- data/ext/uchardet/src/LangModels/LangFrenchModel.cpp +209 -0
- data/ext/uchardet/src/LangModels/LangGermanModel.cpp +170 -0
- data/ext/uchardet/src/LangModels/LangGreekModel.cpp +231 -0
- data/ext/uchardet/src/LangModels/LangHebrewModel.cpp +220 -0
- data/ext/uchardet/src/LangModels/LangHungarianModel.cpp +171 -0
- data/ext/uchardet/src/LangModels/LangIrishModel.cpp +234 -0
- data/ext/uchardet/src/LangModels/LangItalianModel.cpp +269 -0
- data/ext/uchardet/src/LangModels/LangLatvianModel.cpp +210 -0
- data/ext/uchardet/src/LangModels/LangLithuanianModel.cpp +209 -0
- data/ext/uchardet/src/LangModels/LangMalteseModel.cpp +138 -0
- data/ext/uchardet/src/LangModels/LangPolishModel.cpp +304 -0
- data/ext/uchardet/src/LangModels/LangPortugueseModel.cpp +241 -0
- data/ext/uchardet/src/LangModels/LangRomanianModel.cpp +236 -0
- data/ext/uchardet/src/LangModels/LangRussianModel.cpp +367 -0
- data/ext/uchardet/src/LangModels/LangSlovakModel.cpp +293 -0
- data/ext/uchardet/src/LangModels/LangSloveneModel.cpp +264 -0
- data/ext/uchardet/src/LangModels/LangSpanishModel.cpp +204 -0
- data/ext/uchardet/src/LangModels/LangSwedishModel.cpp +266 -0
- data/ext/uchardet/src/LangModels/LangThaiModel.cpp +267 -0
- data/ext/uchardet/src/LangModels/LangTurkishModel.cpp +175 -0
- data/ext/uchardet/src/LangModels/LangVietnameseModel.cpp +249 -0
- data/ext/uchardet/src/nsBig5Prober.cpp +88 -0
- data/ext/uchardet/src/nsBig5Prober.h +75 -0
- data/ext/uchardet/src/nsCharSetProber.cpp +125 -0
- data/ext/uchardet/src/nsCharSetProber.h +77 -0
- data/ext/uchardet/src/nsCodingStateMachine.h +105 -0
- data/ext/uchardet/src/nsEUCJPProber.cpp +99 -0
- data/ext/uchardet/src/nsEUCJPProber.h +79 -0
- data/ext/uchardet/src/nsEUCKRProber.cpp +91 -0
- data/ext/uchardet/src/nsEUCKRProber.h +81 -0
- data/ext/uchardet/src/nsEUCTWProber.cpp +91 -0
- data/ext/uchardet/src/nsEUCTWProber.h +75 -0
- data/ext/uchardet/src/nsEscCharsetProber.cpp +101 -0
- data/ext/uchardet/src/nsEscCharsetProber.h +70 -0
- data/ext/uchardet/src/nsEscSM.cpp +267 -0
- data/ext/uchardet/src/nsGB2312Prober.cpp +96 -0
- data/ext/uchardet/src/nsGB2312Prober.h +77 -0
- data/ext/uchardet/src/nsHebrewProber.cpp +194 -0
- data/ext/uchardet/src/nsHebrewProber.h +177 -0
- data/ext/uchardet/src/nsLatin1Prober.cpp +182 -0
- data/ext/uchardet/src/nsLatin1Prober.h +73 -0
- data/ext/uchardet/src/nsMBCSGroupProber.cpp +242 -0
- data/ext/uchardet/src/nsMBCSGroupProber.h +81 -0
- data/ext/uchardet/src/nsMBCSSM.cpp +513 -0
- data/ext/uchardet/src/nsPkgInt.h +89 -0
- data/ext/uchardet/src/nsSBCSGroupProber.cpp +343 -0
- data/ext/uchardet/src/nsSBCSGroupProber.h +71 -0
- data/ext/uchardet/src/nsSBCharSetProber.cpp +160 -0
- data/ext/uchardet/src/nsSBCharSetProber.h +258 -0
- data/ext/uchardet/src/nsSJISProber.cpp +98 -0
- data/ext/uchardet/src/nsSJISProber.h +81 -0
- data/ext/uchardet/src/nsUTF8Prober.cpp +87 -0
- data/ext/uchardet/src/nsUTF8Prober.h +66 -0
- data/ext/uchardet/src/nsUniversalDetector.cpp +339 -0
- data/ext/uchardet/src/nsUniversalDetector.h +91 -0
- data/ext/uchardet/src/nscore.h +59 -0
- data/ext/uchardet/src/prmem.h +49 -0
- data/ext/uchardet/src/symbols.cmake +41 -0
- data/ext/uchardet/src/tools/CMakeLists.txt +23 -0
- data/ext/uchardet/src/tools/uchardet.cpp +254 -0
- data/ext/uchardet/src/uchardet.cpp +274 -0
- data/ext/uchardet/src/uchardet.h +136 -0
- data/ext/uchardet/test/CMakeLists.txt +47 -0
- data/ext/uchardet/test/ar/iso-8859-6.txt +3 -0
- data/ext/uchardet/test/ar/utf-8.txt +3 -0
- data/ext/uchardet/test/ar/windows-1256.txt +3 -0
- data/ext/uchardet/test/bg/windows-1251.txt +3 -0
- data/ext/uchardet/test/cs/ibm852.txt +4 -0
- data/ext/uchardet/test/cs/iso-8859-2.txt +4 -0
- data/ext/uchardet/test/cs/mac-centraleurope.txt +4 -0
- data/ext/uchardet/test/cs/utf-8.txt +4 -0
- data/ext/uchardet/test/cs/windows-1250.txt +4 -0
- data/ext/uchardet/test/da/iso-8859-1.txt +7 -0
- data/ext/uchardet/test/da/iso-8859-15.txt +10 -0
- data/ext/uchardet/test/da/utf-8.txt +10 -0
- data/ext/uchardet/test/da/windows-1252.txt +10 -0
- data/ext/uchardet/test/de/iso-8859-1.txt +11 -0
- data/ext/uchardet/test/de/windows-1252.txt +11 -0
- data/ext/uchardet/test/el/iso-8859-7.txt +3 -0
- data/ext/uchardet/test/el/utf-8.txt +3 -0
- data/ext/uchardet/test/el/windows-1253.txt +5 -0
- data/ext/uchardet/test/en/ascii.txt +4 -0
- data/ext/uchardet/test/eo/iso-8859-3.txt +7 -0
- data/ext/uchardet/test/es/iso-8859-1.txt +5 -0
- data/ext/uchardet/test/es/iso-8859-15.txt +5 -0
- data/ext/uchardet/test/es/utf-8.txt +5 -0
- data/ext/uchardet/test/es/windows-1252.txt +5 -0
- data/ext/uchardet/test/et/iso-8859-13.txt +6 -0
- data/ext/uchardet/test/et/iso-8859-15.txt +6 -0
- data/ext/uchardet/test/et/iso-8859-4.txt +6 -0
- data/ext/uchardet/test/et/utf-8.txt +6 -0
- data/ext/uchardet/test/et/windows-1252.txt +6 -0
- data/ext/uchardet/test/et/windows-1257.txt +6 -0
- data/ext/uchardet/test/fi/iso-8859-1.txt +8 -0
- data/ext/uchardet/test/fi/utf-8.txt +8 -0
- data/ext/uchardet/test/fr/iso-8859-1.txt +5 -0
- data/ext/uchardet/test/fr/iso-8859-15.txt +16 -0
- data/ext/uchardet/test/fr/utf-16.be +0 -0
- data/ext/uchardet/test/fr/utf-32.le +0 -0
- data/ext/uchardet/test/fr/utf-8.txt +14 -0
- data/ext/uchardet/test/fr/windows-1252.txt +3 -0
- data/ext/uchardet/test/ga/iso-8859-1.txt +6 -0
- data/ext/uchardet/test/ga/utf-8.txt +6 -0
- data/ext/uchardet/test/ga/windows-1252.txt +6 -0
- data/ext/uchardet/test/he/iso-8859-8.txt +2 -0
- data/ext/uchardet/test/he/utf-8.txt +3 -0
- data/ext/uchardet/test/he/windows-1255.txt +1 -0
- data/ext/uchardet/test/hr/ibm852.txt +4 -0
- data/ext/uchardet/test/hr/iso-8859-13.txt +4 -0
- data/ext/uchardet/test/hr/iso-8859-16.txt +4 -0
- data/ext/uchardet/test/hr/iso-8859-2.txt +4 -0
- data/ext/uchardet/test/hr/mac-centraleurope.txt +4 -0
- data/ext/uchardet/test/hr/utf-8.txt +4 -0
- data/ext/uchardet/test/hr/windows-1250.txt +4 -0
- data/ext/uchardet/test/hu/iso-8859-2.txt +3 -0
- data/ext/uchardet/test/hu/windows-1250.txt +1 -0
- data/ext/uchardet/test/it/iso-8859-1.txt +18 -0
- data/ext/uchardet/test/it/utf-8.txt +18 -0
- data/ext/uchardet/test/ja/euc-jp.txt +10 -0
- data/ext/uchardet/test/ja/iso-2022-jp.txt +8 -0
- data/ext/uchardet/test/ja/shift_jis.txt +1 -0
- data/ext/uchardet/test/ja/utf-16be.txt +0 -0
- data/ext/uchardet/test/ja/utf-16le.txt +0 -0
- data/ext/uchardet/test/ja/utf-8.txt +9 -0
- data/ext/uchardet/test/ko/iso-2022-kr.txt +8 -0
- data/ext/uchardet/test/ko/uhc.smi +16 -0
- data/ext/uchardet/test/ko/utf-16.le +0 -0
- data/ext/uchardet/test/ko/utf-32.be +0 -0
- data/ext/uchardet/test/ko/utf-8.txt +3 -0
- data/ext/uchardet/test/lt/iso-8859-10.txt +3 -0
- data/ext/uchardet/test/lt/iso-8859-13.txt +3 -0
- data/ext/uchardet/test/lt/iso-8859-4.txt +3 -0
- data/ext/uchardet/test/lt/utf-8.txt +3 -0
- data/ext/uchardet/test/lv/iso-8859-10.txt +6 -0
- data/ext/uchardet/test/lv/iso-8859-13.txt +6 -0
- data/ext/uchardet/test/lv/iso-8859-4.txt +6 -0
- data/ext/uchardet/test/lv/utf-8.txt +6 -0
- data/ext/uchardet/test/mt/iso-8859-3.txt +4 -0
- data/ext/uchardet/test/mt/utf-8.txt +4 -0
- data/ext/uchardet/test/pl/ibm852.txt +3 -0
- data/ext/uchardet/test/pl/iso-8859-13.txt +3 -0
- data/ext/uchardet/test/pl/iso-8859-16.txt +3 -0
- data/ext/uchardet/test/pl/iso-8859-2.txt +3 -0
- data/ext/uchardet/test/pl/mac-centraleurope.txt +3 -0
- data/ext/uchardet/test/pl/utf-8.txt +3 -0
- data/ext/uchardet/test/pl/windows-1250.txt +3 -0
- data/ext/uchardet/test/pt/iso-8859-1.txt +6 -0
- data/ext/uchardet/test/pt/utf-8.txt +6 -0
- data/ext/uchardet/test/ro/ibm852.txt +9 -0
- data/ext/uchardet/test/ro/iso-8859-16.txt +9 -0
- data/ext/uchardet/test/ro/utf-8.txt +9 -0
- data/ext/uchardet/test/ro/windows-1250.txt +9 -0
- data/ext/uchardet/test/ru/ibm855.txt +5 -0
- data/ext/uchardet/test/ru/ibm866.txt +11 -0
- data/ext/uchardet/test/ru/iso-8859-5.txt +3 -0
- data/ext/uchardet/test/ru/koi8-r.txt +1 -0
- data/ext/uchardet/test/ru/mac-cyrillic.txt +9 -0
- data/ext/uchardet/test/ru/windows-1251.txt +4 -0
- data/ext/uchardet/test/sk/ibm852.txt +3 -0
- data/ext/uchardet/test/sk/iso-8859-2.txt +3 -0
- data/ext/uchardet/test/sk/mac-centraleurope.txt +3 -0
- data/ext/uchardet/test/sk/utf-8.txt +3 -0
- data/ext/uchardet/test/sk/windows-1250.txt +3 -0
- data/ext/uchardet/test/sl/ibm852.txt +9 -0
- data/ext/uchardet/test/sl/iso-8859-16.txt +9 -0
- data/ext/uchardet/test/sl/iso-8859-2.txt +9 -0
- data/ext/uchardet/test/sl/mac-centraleurope.txt +9 -0
- data/ext/uchardet/test/sl/utf-8.txt +9 -0
- data/ext/uchardet/test/sl/windows-1250.txt +9 -0
- data/ext/uchardet/test/sv/iso-8859-1.txt +10 -0
- data/ext/uchardet/test/sv/utf-8.txt +10 -0
- data/ext/uchardet/test/sv/windows-1252.txt +10 -0
- data/ext/uchardet/test/th/iso-8859-11.txt +5 -0
- data/ext/uchardet/test/th/tis-620.txt +5 -0
- data/ext/uchardet/test/th/utf-8.txt +1 -0
- data/ext/uchardet/test/tr/iso-8859-3.txt +13 -0
- data/ext/uchardet/test/tr/iso-8859-9.txt +13 -0
- data/ext/uchardet/test/uchardet-tests.c +130 -0
- data/ext/uchardet/test/vi/utf-8.txt +4 -0
- data/ext/uchardet/test/vi/viscii.txt +4 -0
- data/ext/uchardet/test/vi/windows-1258.txt +4 -0
- data/ext/uchardet/test/zh/big5.txt +1 -0
- data/ext/uchardet/test/zh/euc-tw.txt +1 -0
- data/ext/uchardet/test/zh/gb18030.txt +1 -0
- data/ext/uchardet/test/zh/utf-8.txt +1 -0
- data/ext/uchardet/uchardet.doap +51 -0
- data/ext/uchardet/uchardet.pc.in +10 -0
- data/lib/cchardet.rb +56 -0
- data/lib/cchardet/lib_finder.rb +32 -0
- data/lib/cchardet/version.rb +5 -0
- metadata +362 -0
|
@@ -0,0 +1,166 @@
|
|
|
1
|
+
= Logs of language model for Portuguese (pt) =
|
|
2
|
+
|
|
3
|
+
- Generated by BuildLangModel.py
|
|
4
|
+
- Started: 2016-09-20 23:44:39.722451
|
|
5
|
+
- Maximum depth: 5
|
|
6
|
+
- Max number of pages: 100
|
|
7
|
+
|
|
8
|
+
== Parsed pages ==
|
|
9
|
+
|
|
10
|
+
Papagaio-das-mascarenhas (revision 46763149)
|
|
11
|
+
Albinismo (revision 46498446)
|
|
12
|
+
Alfred Newton (revision 43617011)
|
|
13
|
+
Alphonse Milne-Edwards (revision 39740747)
|
|
14
|
+
Animalia (revision 46727732)
|
|
15
|
+
Asa (revision 46338820)
|
|
16
|
+
August von Pelzeln (revision 34726241)
|
|
17
|
+
Aves (revision 46728980)
|
|
18
|
+
Bico (revision 45311553)
|
|
19
|
+
Carl Wilhelm Hahn (revision 45025566)
|
|
20
|
+
Carlos Lineu (revision 46625396)
|
|
21
|
+
Carolus Linnaeus (revision 46625396)
|
|
22
|
+
Cauda (revision 43275401)
|
|
23
|
+
Charles Lucien Bonaparte (revision 45529712)
|
|
24
|
+
Chordata (revision 46640101)
|
|
25
|
+
Cladograma (revision 46700307)
|
|
26
|
+
Classe (biologia) (revision 46701409)
|
|
27
|
+
Classificação científica (revision 46306288)
|
|
28
|
+
Coleção Leverian (revision 45026647)
|
|
29
|
+
Comores (revision 46181501)
|
|
30
|
+
Coracopsinae (revision 36946101)
|
|
31
|
+
Coracopsis nigra (revision 44338845)
|
|
32
|
+
Coracopsis vasa (revision 42905822)
|
|
33
|
+
Cylindraspis indica (revision 42905410)
|
|
34
|
+
Cúlmen (revision 45311553)
|
|
35
|
+
Digital object identifier (revision 42172651)
|
|
36
|
+
Eclectus roratus (revision 44380798)
|
|
37
|
+
Edward Newton (revision 39261469)
|
|
38
|
+
Endemismo (revision 45260961)
|
|
39
|
+
Epíteto específico (revision 35101647)
|
|
40
|
+
Espécie (revision 45685675)
|
|
41
|
+
Esquilo-vermelho (revision 43489595)
|
|
42
|
+
Estado de conservação (revision 46662839)
|
|
43
|
+
Extinção (revision 46526607)
|
|
44
|
+
Família (biologia) (revision 46636004)
|
|
45
|
+
Filo (revision 46704246)
|
|
46
|
+
França (revision 46740839)
|
|
47
|
+
François-Nicolas Martinet (revision 43679514)
|
|
48
|
+
François Levaillant (revision 40142351)
|
|
49
|
+
Fredrik Hasselqvist (revision 44381122)
|
|
50
|
+
Fregilupus varius (revision 46555765)
|
|
51
|
+
Fumigação (revision 42458244)
|
|
52
|
+
George Robert Gray (revision 39047844)
|
|
53
|
+
Georges-Louis Leclerc, conde de Buffon (revision 45622418)
|
|
54
|
+
Género (biologia) (revision 45296588)
|
|
55
|
+
Hermann Schlegel (revision 43137605)
|
|
56
|
+
Herpetologista (revision 46207704)
|
|
57
|
+
Histoire Naturelle (revision 44293456)
|
|
58
|
+
Holótipo (revision 44029660)
|
|
59
|
+
Ilha da Reunião (revision 45458206)
|
|
60
|
+
Ilha vulcânica (revision 37924535)
|
|
61
|
+
Ilhas Mascarenhas (revision 45858660)
|
|
62
|
+
Ilhas Molucas (revision 45476933)
|
|
63
|
+
International Standard Book Number (revision 46326494)
|
|
64
|
+
Jacques Barraband (revision 45007769)
|
|
65
|
+
Jean Feuilley (revision 43140791)
|
|
66
|
+
Johann Georg Wagler (revision 34585234)
|
|
67
|
+
John Gerrard Keulemans (revision 39664498)
|
|
68
|
+
Julian Hume (revision 41876605)
|
|
69
|
+
Leiolopisma (revision 43997173)
|
|
70
|
+
Lionel Walter Rothschild (revision 46022922)
|
|
71
|
+
Lista Vermelha da IUCN (revision 46569884)
|
|
72
|
+
Lista Vermelha da União Internacional para a Conservação da Natureza e dos Recursos Naturais (revision 46569884)
|
|
73
|
+
Lista Vermelha de Espécies Ameaçadas da IUCN (revision 46569884)
|
|
74
|
+
Lista de aves extintas (revision 45507420)
|
|
75
|
+
Londres (revision 46310311)
|
|
76
|
+
Língua inglesa (revision 46609785)
|
|
77
|
+
Madagascar (revision 46617630)
|
|
78
|
+
Mascarenotus grucheti (revision 43145662)
|
|
79
|
+
Mathurin Jacques Brisson (revision 36018826)
|
|
80
|
+
Maurício (revision 46723599)
|
|
81
|
+
Maximiliano I José da Baviera (revision 46372080)
|
|
82
|
+
Melanina (revision 46762903)
|
|
83
|
+
Museu Nacional de História Natural (França) (revision 43731807)
|
|
84
|
+
Naturhistorisches Museum (revision 46694247)
|
|
85
|
+
Nesoenas duboisi (revision 43995805)
|
|
86
|
+
Nome científico (revision 46671641)
|
|
87
|
+
Nomenclatura binomial (revision 46671641)
|
|
88
|
+
Nycticorax duboisi (revision 43816214)
|
|
89
|
+
Nível do mar (revision 46414695)
|
|
90
|
+
Ordem (biologia) (revision 46360024)
|
|
91
|
+
Otto Finsch (revision 42362273)
|
|
92
|
+
Papagaio (revision 46738207)
|
|
93
|
+
Papagaio-cinzento (revision 46673943)
|
|
94
|
+
Papagaio-cinzento-de-maurício (revision 46664408)
|
|
95
|
+
Pedro Mascarenhas (c. 1484-1555) (revision 45541977)
|
|
96
|
+
Periquito-de-maurício (revision 43010883)
|
|
97
|
+
Periquito-de-reunião (revision 43048764)
|
|
98
|
+
Peter Mundy (revision 43563846)
|
|
99
|
+
Piton des Neiges (revision 45632497)
|
|
100
|
+
Pleistoceno (revision 45916874)
|
|
101
|
+
Plumagem (revision 34951058)
|
|
102
|
+
Ponto quente (revision 45375495)
|
|
103
|
+
Porphyrio coerulescens (revision 43672493)
|
|
104
|
+
Praslin (revision 40728143)
|
|
105
|
+
Psitacídeos (revision 46598835)
|
|
106
|
+
Psittaciformes (revision 46598835)
|
|
107
|
+
Psittacula (revision 42856453)
|
|
108
|
+
Psittaculinae (revision 46760737)
|
|
109
|
+
Psittaculini (revision 43015966)
|
|
110
|
+
Psittrichasiidae (revision 44385977)
|
|
111
|
+
|
|
112
|
+
== End of Parsed pages ==
|
|
113
|
+
|
|
114
|
+
- Wikipedia parsing ended at: 2016-09-20 23:47:27.346826
|
|
115
|
+
|
|
116
|
+
51 characters appeared 558324 times.
|
|
117
|
+
|
|
118
|
+
First 38 characters:
|
|
119
|
+
[ 0] Char a: 11.864795351802895 %
|
|
120
|
+
[ 1] Char e: 11.44604208309154 %
|
|
121
|
+
[ 2] Char o: 9.868284365350585 %
|
|
122
|
+
[ 3] Char s: 8.346587286235232 %
|
|
123
|
+
[ 4] Char i: 7.118089138206489 %
|
|
124
|
+
[ 5] Char r: 6.394136737808154 %
|
|
125
|
+
[ 6] Char n: 5.568272186042513 %
|
|
126
|
+
[ 7] Char d: 5.243192125002687 %
|
|
127
|
+
[ 8] Char t: 4.80061756256224 %
|
|
128
|
+
[ 9] Char m: 4.498105042949971 %
|
|
129
|
+
[10] Char c: 3.9747530107965985 %
|
|
130
|
+
[11] Char u: 3.7229279056605127 %
|
|
131
|
+
[12] Char l: 3.207814817202914 %
|
|
132
|
+
[13] Char p: 2.77562848811801 %
|
|
133
|
+
[14] Char g: 1.3850380782484721 %
|
|
134
|
+
[15] Char v: 1.3210967108703908 %
|
|
135
|
+
[16] Char f: 1.122466524813549 %
|
|
136
|
+
[17] Char b: 0.9702251739133549 %
|
|
137
|
+
[18] Char h: 0.9130898904578704 %
|
|
138
|
+
[19] Char é: 0.7026386112723079 %
|
|
139
|
+
[20] Char ã: 0.7022803963290133 %
|
|
140
|
+
[21] Char q: 0.5903382265494588 %
|
|
141
|
+
[22] Char ç: 0.5856814322866293 %
|
|
142
|
+
[23] Char í: 0.41391736697688086 %
|
|
143
|
+
[24] Char x: 0.3913498255493226 %
|
|
144
|
+
[25] Char á: 0.34567742027926435 %
|
|
145
|
+
[26] Char z: 0.3170202248156984 %
|
|
146
|
+
[27] Char ó: 0.22925756370852768 %
|
|
147
|
+
[28] Char j: 0.20454073262120204 %
|
|
148
|
+
[29] Char ê: 0.20239144296143458 %
|
|
149
|
+
[30] Char õ: 0.16155493942585308 %
|
|
150
|
+
[31] Char y: 0.15080849112701586 %
|
|
151
|
+
[32] Char w: 0.09241945537000021 %
|
|
152
|
+
[33] Char ú: 0.08794176857881804 %
|
|
153
|
+
[34] Char k: 0.08364318925928313 %
|
|
154
|
+
[35] Char â: 0.07898639499645367 %
|
|
155
|
+
[36] Char à: 0.06859816164091102 %
|
|
156
|
+
[37] Char ô: 0.031164700066627977 %
|
|
157
|
+
|
|
158
|
+
The first 38 characters have an accumulated ratio of 0.9998137282294869.
|
|
159
|
+
|
|
160
|
+
891 sequences found.
|
|
161
|
+
|
|
162
|
+
First 512 (typical positive ratio): 0.9953179582313172
|
|
163
|
+
Next 512 (512-1024): 1.7910747164728723e-06
|
|
164
|
+
Rest: 2.42861286636753e-17
|
|
165
|
+
|
|
166
|
+
- Processing end: 2016-09-20 23:47:27.489355
|
|
@@ -0,0 +1,153 @@
|
|
|
1
|
+
= Logs of language model for Romanian (ro) =
|
|
2
|
+
|
|
3
|
+
- Generated by BuildLangModel.py
|
|
4
|
+
- Started: 2016-09-28 18:53:56.086095
|
|
5
|
+
- Maximum depth: 5
|
|
6
|
+
- Max number of pages: 100
|
|
7
|
+
|
|
8
|
+
== Parsed pages ==
|
|
9
|
+
|
|
10
|
+
The Loving Kind (revision 10166481)
|
|
11
|
+
12 ianuarie (revision 10711676)
|
|
12
|
+
13 decembrie (revision 9938353)
|
|
13
|
+
2007 (revision 10716321)
|
|
14
|
+
2008 (revision 10752084)
|
|
15
|
+
2009 (revision 10654003)
|
|
16
|
+
21 noiembrie (revision 10447643)
|
|
17
|
+
25 ianuarie (revision 10228199)
|
|
18
|
+
31 ianuarie (revision 10718063)
|
|
19
|
+
4 Music (revision 9701591)
|
|
20
|
+
Billboard (revision 10505294)
|
|
21
|
+
Biology (revision 10112430)
|
|
22
|
+
Bulgaria (revision 10481051)
|
|
23
|
+
CD (revision 10477531)
|
|
24
|
+
Call The Shots (revision 10101027)
|
|
25
|
+
Call the Shots (revision 10101027)
|
|
26
|
+
Can't Speak French (revision 9721506)
|
|
27
|
+
Casă de discuri (revision 10611348)
|
|
28
|
+
Channel 4 (revision 7953101)
|
|
29
|
+
Chemistry (revision 10112479)
|
|
30
|
+
Cheryl Cole (revision 10475016)
|
|
31
|
+
Chitară (revision 10468266)
|
|
32
|
+
Croația (revision 10737746)
|
|
33
|
+
Dance (revision 10231736)
|
|
34
|
+
Descărcare digitală (revision 10100743)
|
|
35
|
+
Digital Spy (revision 9044016)
|
|
36
|
+
Discografia Girls Aloud (revision 10172788)
|
|
37
|
+
Estonia (revision 10749810)
|
|
38
|
+
Europa (revision 10752724)
|
|
39
|
+
Fascination Records (revision 9655292)
|
|
40
|
+
Fiona Phillips (revision 5384082)
|
|
41
|
+
Gen muzical (revision 10534645)
|
|
42
|
+
Girls A Live (revision 10112444)
|
|
43
|
+
Girls Aloud (revision 10112446)
|
|
44
|
+
Good Morning Television (revision 10166481)
|
|
45
|
+
Heat World (revision 10166481)
|
|
46
|
+
I'll Stand By You (cântec de Girls Aloud) (revision 10112432)
|
|
47
|
+
ITunes (revision 10744174)
|
|
48
|
+
I Think We're Alone Now (revision 10112427)
|
|
49
|
+
Irlanda (revision 10573806)
|
|
50
|
+
Jump (cântec de Girls Aloud) (revision 10112438)
|
|
51
|
+
Lady GaGa (revision 10753010)
|
|
52
|
+
Life Got Cold (revision 10112437)
|
|
53
|
+
Limba engleză (revision 10756676)
|
|
54
|
+
Long Hot Summer (revision 10112429)
|
|
55
|
+
Love Machine (revision 10112433)
|
|
56
|
+
MSN Search (revision 10653298)
|
|
57
|
+
MTV (revision 10170766)
|
|
58
|
+
Mixed Up (revision 10112443)
|
|
59
|
+
Muzică electronică (revision 10608432)
|
|
60
|
+
Muzică pop (revision 10740529)
|
|
61
|
+
Nadine Coyle (revision 10316187)
|
|
62
|
+
Neil Tennant (revision 10499980)
|
|
63
|
+
No Good Advice (revision 10112436)
|
|
64
|
+
Out Of Control (revision 10112484)
|
|
65
|
+
Out of Control (revision 10112484)
|
|
66
|
+
Pet Shop Boys (revision 10612741)
|
|
67
|
+
Poker Face (revision 10496402)
|
|
68
|
+
PopJustice (revision 10625677)
|
|
69
|
+
Regatul Unit (revision 10752338)
|
|
70
|
+
Regatul Unit al Marii Britanii și Irlandei de Nord (revision 10752338)
|
|
71
|
+
Regatul Unit al Marii Britanii și al Irlandei de Nord (revision 10752338)
|
|
72
|
+
Republica Irlanda (revision 10573806)
|
|
73
|
+
Romanian Top 100 (revision 10736281)
|
|
74
|
+
România (revision 10732435)
|
|
75
|
+
Sarah Harding (revision 10633651)
|
|
76
|
+
Sarah Hearding (revision 10112425)
|
|
77
|
+
See the Day (revision 10112431)
|
|
78
|
+
Sexy! No No No... (revision 10112425)
|
|
79
|
+
Slant Magazine (revision 7697473)
|
|
80
|
+
Slovenia (revision 10521499)
|
|
81
|
+
Something Kinda Ooooh (revision 10112426)
|
|
82
|
+
Sound of the Underground (album) (revision 10112476)
|
|
83
|
+
Sound of the Underground (cântec) (revision 10112434)
|
|
84
|
+
Tangled Up (revision 10112482)
|
|
85
|
+
The Guardian (revision 9752334)
|
|
86
|
+
The Paul O'Grady Show (revision 10101027)
|
|
87
|
+
The Promise (revision 10166482)
|
|
88
|
+
The Show (revision 10112441)
|
|
89
|
+
The Sound of Girls Aloud (revision 10112480)
|
|
90
|
+
Tonalitate (revision 9966362)
|
|
91
|
+
Turneul Out of Control (revision 10112446)
|
|
92
|
+
UK Mix (revision 9721468)
|
|
93
|
+
UK Singles Chart (revision 10226705)
|
|
94
|
+
Ungaria (revision 10737745)
|
|
95
|
+
Uniunea Europeană (revision 10751590)
|
|
96
|
+
Untouchable (revision 10112410)
|
|
97
|
+
Wake Me Up (revision 10112439)
|
|
98
|
+
What Will The Neighbours Say? (revision 10112478)
|
|
99
|
+
Whole Lotta History (revision 10475020)
|
|
100
|
+
Wideboys (revision 10166481)
|
|
101
|
+
Wikimedia Commons (revision 9703907)
|
|
102
|
+
Xenomania (revision 10112484)
|
|
103
|
+
|
|
104
|
+
== End of Parsed pages ==
|
|
105
|
+
|
|
106
|
+
- Wikipedia parsing ended at: 2016-09-28 18:58:13.756622
|
|
107
|
+
|
|
108
|
+
60 characters appeared 883554 times.
|
|
109
|
+
|
|
110
|
+
First 33 characters:
|
|
111
|
+
[ 0] Char e: 11.67014127036944 %
|
|
112
|
+
[ 1] Char i: 10.97567324690964 %
|
|
113
|
+
[ 2] Char a: 10.080198833348046 %
|
|
114
|
+
[ 3] Char r: 7.490657050955572 %
|
|
115
|
+
[ 4] Char n: 7.18246988865423 %
|
|
116
|
+
[ 5] Char t: 6.516296683620921 %
|
|
117
|
+
[ 6] Char l: 5.595130574928075 %
|
|
118
|
+
[ 7] Char u: 5.551217016730161 %
|
|
119
|
+
[ 8] Char o: 4.922732509840938 %
|
|
120
|
+
[ 9] Char c: 4.495707110148333 %
|
|
121
|
+
[10] Char s: 3.8308920563994957 %
|
|
122
|
+
[11] Char d: 3.590499279048027 %
|
|
123
|
+
[12] Char m: 2.971408651876399 %
|
|
124
|
+
[13] Char p: 2.902369294915761 %
|
|
125
|
+
[14] Char ă: 2.1349006399156134 %
|
|
126
|
+
[15] Char g: 1.2248261000459508 %
|
|
127
|
+
[16] Char f: 1.1199089133205216 %
|
|
128
|
+
[17] Char b: 1.0781457613230203 %
|
|
129
|
+
[18] Char ț: 1.0323081554721047 %
|
|
130
|
+
[19] Char ș: 0.9732285745975912 %
|
|
131
|
+
[20] Char î: 0.97017273420753 %
|
|
132
|
+
[21] Char v: 0.9693804792915882 %
|
|
133
|
+
[22] Char z: 0.7369102510995367 %
|
|
134
|
+
[23] Char h: 0.533413916976212 %
|
|
135
|
+
[24] Char â: 0.4986678799484808 %
|
|
136
|
+
[25] Char x: 0.22081276300033725 %
|
|
137
|
+
[26] Char j: 0.20055367300696958 %
|
|
138
|
+
[27] Char k: 0.1901411798260208 %
|
|
139
|
+
[28] Char y: 0.15471606715605385 %
|
|
140
|
+
[29] Char w: 0.11827234102273318 %
|
|
141
|
+
[30] Char á: 0.016297815413658927 %
|
|
142
|
+
[31] Char é: 0.013355154297303842 %
|
|
143
|
+
[32] Char q: 0.00520624659047438 %
|
|
144
|
+
|
|
145
|
+
The first 33 characters have an accumulated ratio of 0.9996661211425673.
|
|
146
|
+
|
|
147
|
+
981 sequences found.
|
|
148
|
+
|
|
149
|
+
First 512 (typical positive ratio): 0.997762564143313
|
|
150
|
+
Next 512 (512-1024): 1.1317927370596478e-06
|
|
151
|
+
Rest: 3.0357660829594124e-18
|
|
152
|
+
|
|
153
|
+
- Processing end: 2016-09-28 18:58:13.862425
|
|
@@ -0,0 +1,158 @@
|
|
|
1
|
+
= Logs of language model for Slovak (sk) =
|
|
2
|
+
|
|
3
|
+
- Generated by BuildLangModel.py
|
|
4
|
+
- Started: 2016-09-21 13:26:28.712674
|
|
5
|
+
- Maximum depth: 5
|
|
6
|
+
- Max number of pages: 100
|
|
7
|
+
|
|
8
|
+
== Parsed pages ==
|
|
9
|
+
|
|
10
|
+
Dôkaz (matematika) (revision 6358810)
|
|
11
|
+
1825 (revision 6122752)
|
|
12
|
+
1839 (revision 6165808)
|
|
13
|
+
1847 (revision 5941780)
|
|
14
|
+
1852 (revision 5941777)
|
|
15
|
+
1878 (revision 6221358)
|
|
16
|
+
1955 (revision 6226609)
|
|
17
|
+
1976 (revision 6310709)
|
|
18
|
+
1983 (revision 6356952)
|
|
19
|
+
1993 (revision 6348358)
|
|
20
|
+
1995 (revision 6277350)
|
|
21
|
+
2012 (revision 6291145)
|
|
22
|
+
Adrien-Marie Legendre (revision 6060342)
|
|
23
|
+
Algebra (revision 6319238)
|
|
24
|
+
Algebraická geometria (revision 5964212)
|
|
25
|
+
Algebraická rovnica (revision 5288111)
|
|
26
|
+
Algebrické číslo (revision 6106622)
|
|
27
|
+
Algoritmus (revision 6286937)
|
|
28
|
+
Andrew Wiles (revision 5791970)
|
|
29
|
+
Arabi (revision 6044956)
|
|
30
|
+
Arabčina (revision 6322514)
|
|
31
|
+
Aristoteles (revision 6359959)
|
|
32
|
+
Arthur Cayley (revision 6332355)
|
|
33
|
+
Axióma (revision 6338092)
|
|
34
|
+
Babylonia (revision 6168813)
|
|
35
|
+
Bernard Bolzano (revision 6261374)
|
|
36
|
+
Boh (revision 6282272)
|
|
37
|
+
Bolzanova veta (revision 6345299)
|
|
38
|
+
Bytie (revision 5274918)
|
|
39
|
+
Byzantská ríša (revision 6359782)
|
|
40
|
+
Caroline Blundenová (revision 6358810)
|
|
41
|
+
Cauchyho postupnosť (revision 6215169)
|
|
42
|
+
Celé číslo (revision 6302805)
|
|
43
|
+
Charles Hermite (revision 5751036)
|
|
44
|
+
Daniel Marcus (revision 5657431)
|
|
45
|
+
David Hilbert (revision 5968866)
|
|
46
|
+
Dedukcia (revision 6338099)
|
|
47
|
+
Definícia (revision 6106684)
|
|
48
|
+
Derivácia (funkcia) (revision 5970574)
|
|
49
|
+
Desiatková číselná sústava (revision 5924486)
|
|
50
|
+
Diofantická rovnica (revision 6327292)
|
|
51
|
+
Dynastia Chan (revision 6342042)
|
|
52
|
+
Dôkaz (logika) (revision 5495754)
|
|
53
|
+
Dôkaz sporom (revision 5940134)
|
|
54
|
+
Dôkaz výpočtom (revision 6358810)
|
|
55
|
+
Energia (revision 6277761)
|
|
56
|
+
Eric Weisstein (revision 6054413)
|
|
57
|
+
Ernst Kummer (revision 6001344)
|
|
58
|
+
Európa (revision 6295124)
|
|
59
|
+
Experiment (revision 6354302)
|
|
60
|
+
Fenomén (filozofia) (revision 5420897)
|
|
61
|
+
Filozofia (revision 6296369)
|
|
62
|
+
Formula (logika) (revision 3916562)
|
|
63
|
+
Formálny dôkaz (revision 6358810)
|
|
64
|
+
Formálny jazyk (revision 5623029)
|
|
65
|
+
Gabriel Cramer (revision 5923903)
|
|
66
|
+
Galoisova teória (revision 6353573)
|
|
67
|
+
Gentzenovský kalkul (revision 6358810)
|
|
68
|
+
Geometria (revision 5970028)
|
|
69
|
+
Geometrický dôkaz (revision 6358810)
|
|
70
|
+
Georg Ferdinand Cantor (revision 6186696)
|
|
71
|
+
Giordano Bruno (revision 6312876)
|
|
72
|
+
Gottlob Frege (revision 5968855)
|
|
73
|
+
Gödelova veta o neúplnosti (revision 5323549)
|
|
74
|
+
Hardvér (revision 6214401)
|
|
75
|
+
Henri Poincaré (revision 6315506)
|
|
76
|
+
Hilbertovský kalkul (revision 6358810)
|
|
77
|
+
Hmotnosť (revision 5979540)
|
|
78
|
+
Hypotéza (revision 5983410)
|
|
79
|
+
Idea (revision 5960449)
|
|
80
|
+
India (revision 6362189)
|
|
81
|
+
Intuícia (revision 5837951)
|
|
82
|
+
Jazyk (lingvistika) (revision 6073293)
|
|
83
|
+
John Taylor (revision 6355518)
|
|
84
|
+
Kardinálne číslo (revision 6090126)
|
|
85
|
+
Kenneth Appel (revision 5968422)
|
|
86
|
+
Klasická mechanika (revision 6295646)
|
|
87
|
+
Konečná množina (revision 5276494)
|
|
88
|
+
Konfucianizmus (revision 5968816)
|
|
89
|
+
Kresťanstvo (revision 6289571)
|
|
90
|
+
Langlandsov program (revision 6088475)
|
|
91
|
+
Latinčina (revision 6121105)
|
|
92
|
+
Leonhard Euler (revision 6339382)
|
|
93
|
+
Lineárna algebra (revision 5473535)
|
|
94
|
+
Logická axióma (revision 5495754)
|
|
95
|
+
Logický kalkul (revision 1608550)
|
|
96
|
+
|
|
97
|
+
== End of Parsed pages ==
|
|
98
|
+
|
|
99
|
+
- Wikipedia parsing ended at: 2016-09-21 13:33:10.330458
|
|
100
|
+
|
|
101
|
+
62 characters appeared 550293 times.
|
|
102
|
+
|
|
103
|
+
First 45 characters:
|
|
104
|
+
[ 0] Char o: 8.867094438780795 %
|
|
105
|
+
[ 1] Char a: 8.59705647718579 %
|
|
106
|
+
[ 2] Char e: 8.562347694773512 %
|
|
107
|
+
[ 3] Char n: 6.0867574183207855 %
|
|
108
|
+
[ 4] Char i: 5.828531346028389 %
|
|
109
|
+
[ 5] Char t: 5.366595613609477 %
|
|
110
|
+
[ 6] Char r: 4.977711873492848 %
|
|
111
|
+
[ 7] Char k: 4.264273759615332 %
|
|
112
|
+
[ 8] Char s: 4.257731790155426 %
|
|
113
|
+
[ 9] Char v: 4.117079446767449 %
|
|
114
|
+
[10] Char l: 3.5979014815743615 %
|
|
115
|
+
[11] Char d: 3.416361829061972 %
|
|
116
|
+
[12] Char m: 3.2513588215732345 %
|
|
117
|
+
[13] Char p: 2.878466562358598 %
|
|
118
|
+
[14] Char u: 2.5987973679476206 %
|
|
119
|
+
[15] Char c: 2.419438371921867 %
|
|
120
|
+
[16] Char z: 2.127412124086623 %
|
|
121
|
+
[17] Char h: 2.0687161203213558 %
|
|
122
|
+
[18] Char j: 2.0312815173007834 %
|
|
123
|
+
[19] Char y: 1.6700194260148686 %
|
|
124
|
+
[20] Char b: 1.6574806512167153 %
|
|
125
|
+
[21] Char á: 1.6422160558102683 %
|
|
126
|
+
[22] Char ý: 1.2564215790497062 %
|
|
127
|
+
[23] Char í: 1.1326693234331529 %
|
|
128
|
+
[24] Char č: 0.9473135220691523 %
|
|
129
|
+
[25] Char é: 0.8913433389121795 %
|
|
130
|
+
[26] Char ž: 0.7668641978000811 %
|
|
131
|
+
[27] Char ú: 0.6949025337411161 %
|
|
132
|
+
[28] Char š: 0.6785476100913513 %
|
|
133
|
+
[29] Char f: 0.6514711253822963 %
|
|
134
|
+
[30] Char g: 0.6096752093884531 %
|
|
135
|
+
[31] Char ť: 0.46375294615777407 %
|
|
136
|
+
[32] Char ô: 0.4172322744428877 %
|
|
137
|
+
[33] Char ľ: 0.36053520579036985 %
|
|
138
|
+
[34] Char x: 0.23114958758334195 %
|
|
139
|
+
[35] Char ó: 0.2251527822450949 %
|
|
140
|
+
[36] Char ň: 0.09304134342977287 %
|
|
141
|
+
[37] Char w: 0.09013380144759246 %
|
|
142
|
+
[38] Char ä: 0.0694175648245571 %
|
|
143
|
+
[39] Char ď: 0.06560141597294532 %
|
|
144
|
+
[40] Char q: 0.01726353051919614 %
|
|
145
|
+
[41] Char ě: 0.009994675563745132 %
|
|
146
|
+
[42] Char ĺ: 0.009267790068200032 %
|
|
147
|
+
[43] Char ö: 0.008904347320427481 %
|
|
148
|
+
[44] Char ŕ: 0.00599680533824708 %
|
|
149
|
+
|
|
150
|
+
The first 45 characters have an accumulated ratio of 0.9998128269848972.
|
|
151
|
+
|
|
152
|
+
1181 sequences found.
|
|
153
|
+
|
|
154
|
+
First 512 (typical positive ratio): 0.9733303573968434
|
|
155
|
+
Next 512 (512-1024): 1.8172137388627513e-06
|
|
156
|
+
Rest: 0.0003522983638913346
|
|
157
|
+
|
|
158
|
+
- Processing end: 2016-09-21 13:33:10.831531
|