commit dc5c142e3eefd21d071bd6b42c0436fe99455a62 parent 175899376eb728e3a545108e5c16a906f9e46234 Author: Christian Grothoff <christian@grothoff.org> Date: Wed, 14 Sep 2005 06:36:43 +0000 language detection code from libkat 0.6.3 Diffstat:
| M | AUTHORS | | | 1 | + |
| A | src/plugins/language/Makefile.am | | | 15 | +++++++++++++++ |
| A | src/plugins/language/Makefile.in | | | 605 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/afrikaans.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/albanian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/arabic.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/arabic2.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/armenian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/basque.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/belarus.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/bosnian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/breton.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/bulgarian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/catalan.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/chinese.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/chinese1.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/chinese2.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/croatian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/czech.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/danish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/dutch.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/english.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/esperanto.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/estonian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/finnish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/french.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/frisian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/georgian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/german.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/greek.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/hawaian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/hebrew.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/hindi.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/hungarian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/icelandic.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/indonesian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/irish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/italian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/japanese-euc_jp.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/japanese-shift_jis.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/katlanguagemanager.cpp | | | 310 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/korean.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/latin.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/latvian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/lithuanian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/malay.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/manx.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/marathi.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/mf.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/middle-frisian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/mingo.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/nepali.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/norwegian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/persian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/polish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/portuguese.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/quechua.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/romanian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/rumantsch.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/russian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/russian1.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/russian2.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/sanskrit.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/scots.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/scots_gaelic.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/serbian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/slovak.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/slovak2.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/slovenian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/slovenian2.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/spanish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/swahili.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/tagalog.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/tamil.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/thai.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/turkish.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/ukrainian.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/vietnamese.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
| A | src/plugins/language/welsh.klp | | | 404 | +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
79 files changed, 31231 insertions(+), 0 deletions(-)
diff --git a/AUTHORS b/AUTHORS @@ -30,6 +30,7 @@ hash - core team using GNU coreutils/textutils and GPL'ed RMD160 code. translit - Nils Durner <n.durner@t-online.de> thumbnail - core team using ImageMagick exiv2 - Andreas Huggel <ahuggel@gmx.net> +language - Roberto Cappuccio <roberto.cappuccio@gmail.com> (from libkat) General contributors: Yuri N. Sedunov <aris@altlinux.ru> diff --git a/src/plugins/language/Makefile.am b/src/plugins/language/Makefile.am @@ -0,0 +1,15 @@ +languagedir = $(datadir)/libextractor/language + +language_DATA = afrikaans.klp albanian.klp arabic2.klp arabic.klp armenian.klp \ + basque.klp belarus.klp bosnian.klp breton.klp bulgarian.klp catalan.klp \ + chinese1.klp chinese2.klp chinese.klp croatian.klp czech.klp danish.klp dutch.klp \ + english.klp esperanto.klp estonian.klp finnish.klp french.klp frisian.klp \ + georgian.klp german.klp greek.klp hawaian.klp hebrew.klp hindi.klp hungarian.klp \ + icelandic.klp indonesian.klp irish.klp italian.klp japanese-euc_jp.klp \ + japanese-shift_jis.klp korean.klp latin.klp latvian.klp lithuanian.klp malay.klp \ + manx.klp marathi.klp mf.klp middle-frisian.klp mingo.klp nepali.klp norwegian.klp \ + persian.klp polish.klp portuguese.klp quechua.klp romanian.klp rumantsch.klp \ + russian1.klp russian2.klp russian.klp sanskrit.klp scots_gaelic.klp scots.klp \ + serbian.klp slovak2.klp slovak.klp slovenian2.klp slovenian.klp spanish.klp \ + swahili.klp tagalog.klp tamil.klp thai.klp turkish.klp ukrainian.klp \ + vietnamese.klp welsh.klp diff --git a/src/plugins/language/Makefile.in b/src/plugins/language/Makefile.in @@ -0,0 +1,605 @@ +# Makefile.in generated by automake 1.9.4 from Makefile.am. +# KDE tags expanded automatically by am_edit - $Revision: 435799 $ +# @configure_input@ + +# Copyright (C) 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, +# 2003, 2004 Free Software Foundation, Inc. +# This Makefile.in is free software; the Free Software Foundation +# gives unlimited permission to copy and/or distribute it, +# with or without modifications, as long as this notice is preserved. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY, to the extent permitted by law; without +# even the implied warranty of MERCHANTABILITY or FITNESS FOR A +# PARTICULAR PURPOSE. + +@SET_MAKE@ + +srcdir = @srcdir@ +top_srcdir = @top_srcdir@ +VPATH = @srcdir@ +pkgdatadir = $(datadir)/@PACKAGE@ +pkglibdir = $(libdir)/@PACKAGE@ +pkgincludedir = $(includedir)/@PACKAGE@ +top_builddir = ../../.. +am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd +INSTALL = @INSTALL@ +install_sh_DATA = $(install_sh) -c -m 644 +install_sh_PROGRAM = $(install_sh) -c +install_sh_SCRIPT = $(install_sh) -c +INSTALL_HEADER = $(INSTALL_DATA) +transform = $(program_transform_name) +NORMAL_INSTALL = : +PRE_INSTALL = : +POST_INSTALL = : +NORMAL_UNINSTALL = : +PRE_UNINSTALL = : +POST_UNINSTALL = : +build_triplet = @build@ +host_triplet = @host@ +target_triplet = @target@ +subdir = kat/src/language +DIST_COMMON = $(srcdir)/Makefile.am $(srcdir)/Makefile.in +ACLOCAL_M4 = $(top_srcdir)/aclocal.m4 +am__aclocal_m4_deps = $(top_srcdir)/acinclude.m4 \ + $(top_srcdir)/configure.in +am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \ + $(ACLOCAL_M4) +mkinstalldirs = $(SHELL) $(top_srcdir)/admin/mkinstalldirs +CONFIG_HEADER = $(top_builddir)/config.h +CONFIG_CLEAN_FILES = +SOURCES = +DIST_SOURCES = +am__vpath_adj_setup = srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`; +am__vpath_adj = case $$p in \ + $(srcdir)/*) f=`echo "$$p" | sed "s|^$$srcdirstrip/||"`;; \ + *) f=$$p;; \ + esac; +am__strip_dir = `echo $$p | sed -e 's|^.*/||'`; +am__installdirs = "$(DESTDIR)$(languagedir)" +languageDATA_INSTALL = $(INSTALL_DATA) +DATA = $(language_DATA) +#>- DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST) +#>+ 1 +DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST) $(KDE_DIST) +ACLOCAL = @ACLOCAL@ +AMDEP_FALSE = @AMDEP_FALSE@ +AMDEP_TRUE = @AMDEP_TRUE@ +AMTAR = @AMTAR@ +AR = @AR@ +ARTSCCONFIG = @ARTSCCONFIG@ +AUTOCONF = @AUTOCONF@ +AUTODIRS = @AUTODIRS@ +AUTOHEADER = @AUTOHEADER@ +AUTOMAKE = @AUTOMAKE@ +AWK = @AWK@ +CC = @CC@ +CCDEPMODE = @CCDEPMODE@ +CFLAGS = @CFLAGS@ +CONF_FILES = @CONF_FILES@ +CPP = @CPP@ +CPPFLAGS = @CPPFLAGS@ +CXX = @CXX@ +CXXCPP = @CXXCPP@ +CXXDEPMODE = @CXXDEPMODE@ +CXXFLAGS = @CXXFLAGS@ +CYGPATH_W = @CYGPATH_W@ +DCOPIDL = @DCOPIDL@ +DCOPIDL2CPP = @DCOPIDL2CPP@ +DCOPIDLNG = @DCOPIDLNG@ +DCOP_DEPENDENCIES = @DCOP_DEPENDENCIES@ +DEFS = @DEFS@ +DEPDIR = @DEPDIR@ +DOXYGEN = @DOXYGEN@ +DOXYGEN_PROJECT_NAME = @DOXYGEN_PROJECT_NAME@ +DOXYGEN_PROJECT_NUMBER = @DOXYGEN_PROJECT_NUMBER@ +ECHO = @ECHO@ +ECHO_C = @ECHO_C@ +ECHO_N = @ECHO_N@ +ECHO_T = @ECHO_T@ +EGREP = @EGREP@ +ENABLE_PERMISSIVE_FLAG = @ENABLE_PERMISSIVE_FLAG@ +EXEEXT = @EXEEXT@ +F77 = @F77@ +FFLAGS = @FFLAGS@ +FRAMEWORK_COREAUDIO = @FRAMEWORK_COREAUDIO@ +GMSGFMT = @GMSGFMT@ +HAVE_ATTR_H = @HAVE_ATTR_H@ +HAVE_GCC_VISIBILITY = @HAVE_GCC_VISIBILITY@ +INSTALL_DATA = @INSTALL_DATA@ +INSTALL_PROGRAM = @INSTALL_PROGRAM@ +INSTALL_SCRIPT = @INSTALL_SCRIPT@ +INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@ +KCFG_DEPENDENCIES = @KCFG_DEPENDENCIES@ +KCONFIG_COMPILER = @KCONFIG_COMPILER@ +KDECONFIG = @KDECONFIG@ +KDE_CHECK_PLUGIN = @KDE_CHECK_PLUGIN@ +KDE_EXTRA_RPATH = @KDE_EXTRA_RPATH@ +KDE_HAS_DOXYGEN = @KDE_HAS_DOXYGEN@ +KDE_HAVE_DOT = @KDE_HAVE_DOT@ +KDE_INCLUDES = @KDE_INCLUDES@ +KDE_INSTALLED_FALSE = @KDE_INSTALLED_FALSE@ +KDE_INSTALLED_TRUE = @KDE_INSTALLED_TRUE@ +KDE_LDFLAGS = @KDE_LDFLAGS@ +KDE_MT_LDFLAGS = @KDE_MT_LDFLAGS@ +KDE_MT_LIBS = @KDE_MT_LIBS@ +KDE_NO_UNDEFINED = @KDE_NO_UNDEFINED@ +KDE_PLUGIN = @KDE_PLUGIN@ +KDE_RPATH = @KDE_RPATH@ +KDE_USE_CLOSURE_FALSE = @KDE_USE_CLOSURE_FALSE@ +KDE_USE_CLOSURE_TRUE = @KDE_USE_CLOSURE_TRUE@ +KDE_USE_FINAL_FALSE = @KDE_USE_FINAL_FALSE@ +KDE_USE_FINAL_TRUE = @KDE_USE_FINAL_TRUE@ +KDE_USE_FPIE = @KDE_USE_FPIE@ +KDE_USE_NMCHECK_FALSE = @KDE_USE_NMCHECK_FALSE@ +KDE_USE_NMCHECK_TRUE = @KDE_USE_NMCHECK_TRUE@ +KDE_USE_PIE = @KDE_USE_PIE@ +KDE_XSL_STYLESHEET = @KDE_XSL_STYLESHEET@ +LDFLAGS = @LDFLAGS@ +LDFLAGS_AS_NEEDED = @LDFLAGS_AS_NEEDED@ +LDFLAGS_NEW_DTAGS = @LDFLAGS_NEW_DTAGS@ +LEX = @LEX@ +LEXLIB = @LEXLIB@ +LEX_OUTPUT_ROOT = @LEX_OUTPUT_ROOT@ +LFLAGS = @LFLAGS@ +LIBCOMPAT = @LIBCOMPAT@ +LIBCRYPT = @LIBCRYPT@ +LIBDL = @LIBDL@ +LIBJPEG = @LIBJPEG@ +LIBOBJS = @LIBOBJS@ +LIBPNG = @LIBPNG@ +LIBPTHREAD = @LIBPTHREAD@ +LIBRESOLV = @LIBRESOLV@ +LIBS = @LIBS@ +LIBSM = @LIBSM@ +LIBSOCKET = @LIBSOCKET@ +LIBTOOL = @LIBTOOL@ +LIBUCB = @LIBUCB@ +LIBUTIL = @LIBUTIL@ +LIBZ = @LIBZ@ +LIB_KAB = @LIB_KAB@ +LIB_KABC = @LIB_KABC@ +LIB_KDECORE = @LIB_KDECORE@ +LIB_KDED = @LIB_KDED@ +LIB_KDEPIM = @LIB_KDEPIM@ +LIB_KDEPRINT = @LIB_KDEPRINT@ +LIB_KDEUI = @LIB_KDEUI@ +LIB_KDNSSD = @LIB_KDNSSD@ +LIB_KFILE = @LIB_KFILE@ +LIB_KFM = @LIB_KFM@ +LIB_KHTML = @LIB_KHTML@ +LIB_KIMPROXY = @LIB_KIMPROXY@ +LIB_KIO = @LIB_KIO@ +LIB_KJS = @LIB_KJS@ +LIB_KNEWSTUFF = @LIB_KNEWSTUFF@ +LIB_KPARTS = @LIB_KPARTS@ +LIB_KSPELL = @LIB_KSPELL@ +LIB_KSYCOCA = @LIB_KSYCOCA@ +LIB_KUNITTEST = @LIB_KUNITTEST@ +LIB_KUTILS = @LIB_KUTILS@ +LIB_POLL = @LIB_POLL@ +LIB_QPE = @LIB_QPE@ +LIB_QT = @LIB_QT@ +LIB_SMB = @LIB_SMB@ +LIB_X11 = @LIB_X11@ +LIB_XEXT = @LIB_XEXT@ +LIB_XRENDER = @LIB_XRENDER@ +LN_S = @LN_S@ +LTLIBOBJS = @LTLIBOBJS@ +MAKEINFO = @MAKEINFO@ +MAKEKDEWIDGETS = @MAKEKDEWIDGETS@ +MCOPIDL = @MCOPIDL@ +MEINPROC = @MEINPROC@ +MOC = @MOC@ +MSGFMT = @MSGFMT@ +NOOPT_CFLAGS = @NOOPT_CFLAGS@ +NOOPT_CXXFLAGS = @NOOPT_CXXFLAGS@ +OBJEXT = @OBJEXT@ +PACKAGE = @PACKAGE@ +PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@ +PACKAGE_NAME = @PACKAGE_NAME@ +PACKAGE_STRING = @PACKAGE_STRING@ +PACKAGE_TARNAME = @PACKAGE_TARNAME@ +PACKAGE_VERSION = @PACKAGE_VERSION@ +PATH_SEPARATOR = @PATH_SEPARATOR@ +PERL = @PERL@ +QTDOCDIR = @QTDOCDIR@ +QTE_NORTTI = @QTE_NORTTI@ +QT_INCLUDES = @QT_INCLUDES@ +QT_LDFLAGS = @QT_LDFLAGS@ +RANLIB = @RANLIB@ +SET_MAKE = @SET_MAKE@ +SHELL = @SHELL@ +STRIP = @STRIP@ +TOPSUBDIRS = @TOPSUBDIRS@ +UIC = @UIC@ +UIC_TR = @UIC_TR@ +USER_INCLUDES = @USER_INCLUDES@ +USER_LDFLAGS = @USER_LDFLAGS@ +USE_EXCEPTIONS = @USE_EXCEPTIONS@ +USE_RTTI = @USE_RTTI@ +USE_THREADS = @USE_THREADS@ +VERSION = @VERSION@ +WOVERLOADED_VIRTUAL = @WOVERLOADED_VIRTUAL@ +XGETTEXT = @XGETTEXT@ +XMLLINT = @XMLLINT@ +X_EXTRA_LIBS = @X_EXTRA_LIBS@ +X_INCLUDES = @X_INCLUDES@ +X_LDFLAGS = @X_LDFLAGS@ +X_PRE_LIBS = @X_PRE_LIBS@ +X_RPATH = @X_RPATH@ +ac_ct_AR = @ac_ct_AR@ +ac_ct_CC = @ac_ct_CC@ +ac_ct_CXX = @ac_ct_CXX@ +ac_ct_F77 = @ac_ct_F77@ +ac_ct_RANLIB = @ac_ct_RANLIB@ +ac_ct_STRIP = @ac_ct_STRIP@ +all_includes = @all_includes@ +all_libraries = @all_libraries@ +am__fastdepCC_FALSE = @am__fastdepCC_FALSE@ +am__fastdepCC_TRUE = @am__fastdepCC_TRUE@ +am__fastdepCXX_FALSE = @am__fastdepCXX_FALSE@ +am__fastdepCXX_TRUE = @am__fastdepCXX_TRUE@ +am__include = @am__include@ +am__leading_dot = @am__leading_dot@ +am__quote = @am__quote@ +am__tar = @am__tar@ +am__untar = @am__untar@ +bindir = @bindir@ +build = @build@ +build_alias = @build_alias@ +build_cpu = @build_cpu@ +build_os = @build_os@ +build_vendor = @build_vendor@ +datadir = @datadir@ +exec_prefix = @exec_prefix@ +host = @host@ +host_alias = @host_alias@ +host_cpu = @host_cpu@ +host_os = @host_os@ +host_vendor = @host_vendor@ +include_ARTS_FALSE = @include_ARTS_FALSE@ +include_ARTS_TRUE = @include_ARTS_TRUE@ +include_x11_FALSE = @include_x11_FALSE@ +include_x11_TRUE = @include_x11_TRUE@ +includedir = @includedir@ +infodir = @infodir@ +install_sh = @install_sh@ +kat_SUBDIR_included_FALSE = @kat_SUBDIR_included_FALSE@ +kat_SUBDIR_included_TRUE = @kat_SUBDIR_included_TRUE@ +kde_appsdir = @kde_appsdir@ +kde_bindir = @kde_bindir@ +kde_confdir = @kde_confdir@ +kde_datadir = @kde_datadir@ +kde_htmldir = @kde_htmldir@ +kde_icondir = @kde_icondir@ +kde_includes = @kde_includes@ +kde_kcfgdir = @kde_kcfgdir@ +kde_libraries = @kde_libraries@ +kde_libs_htmldir = @kde_libs_htmldir@ +kde_libs_prefix = @kde_libs_prefix@ +kde_locale = @kde_locale@ +kde_mimedir = @kde_mimedir@ +kde_moduledir = @kde_moduledir@ +kde_qtver = @kde_qtver@ +kde_servicesdir = @kde_servicesdir@ +kde_servicetypesdir = @kde_servicetypesdir@ +kde_sounddir = @kde_sounddir@ +kde_styledir = @kde_styledir@ +kde_templatesdir = @kde_templatesdir@ +kde_wallpaperdir = @kde_wallpaperdir@ +kde_widgetdir = @kde_widgetdir@ +kdeinitdir = @kdeinitdir@ +libdir = @libdir@ +libexecdir = @libexecdir@ +localstatedir = @localstatedir@ +mandir = @mandir@ +mkdir_p = @mkdir_p@ +oldincludedir = @oldincludedir@ +po_SUBDIR_included_FALSE = @po_SUBDIR_included_FALSE@ +po_SUBDIR_included_TRUE = @po_SUBDIR_included_TRUE@ +prefix = @prefix@ +program_transform_name = @program_transform_name@ +qt_includes = @qt_includes@ +qt_libraries = @qt_libraries@ +sbindir = @sbindir@ +sharedstatedir = @sharedstatedir@ +sysconfdir = @sysconfdir@ +target = @target@ +target_alias = @target_alias@ +target_cpu = @target_cpu@ +target_os = @target_os@ +target_vendor = @target_vendor@ +unsermake_enable_pch_FALSE = @unsermake_enable_pch_FALSE@ +unsermake_enable_pch_TRUE = @unsermake_enable_pch_TRUE@ +x_includes = @x_includes@ +x_libraries = @x_libraries@ +xdg_appsdir = @xdg_appsdir@ +xdg_directorydir = @xdg_directorydir@ +xdg_menudir = @xdg_menudir@ +languagedir = $(kde_datadir)/kat/language +language_DATA = afrikaans.klp albanian.klp arabic2.klp arabic.klp armenian.klp \ + basque.klp belarus.klp bosnian.klp breton.klp bulgarian.klp catalan.klp \ + chinese1.klp chinese2.klp chinese.klp croatian.klp czech.klp danish.klp dutch.klp \ + english.klp esperanto.klp estonian.klp finnish.klp french.klp frisian.klp \ + georgian.klp german.klp greek.klp hawaian.klp hebrew.klp hindi.klp hungarian.klp \ + icelandic.klp indonesian.klp irish.klp italian.klp japanese-euc_jp.klp \ + japanese-shift_jis.klp korean.klp latin.klp latvian.klp lithuanian.klp malay.klp \ + manx.klp marathi.klp mf.klp middle-frisian.klp mingo.klp nepali.klp norwegian.klp \ + persian.klp polish.klp portuguese.klp quechua.klp romanian.klp rumantsch.klp \ + russian1.klp russian2.klp russian.klp sanskrit.klp scots_gaelic.klp scots.klp \ + serbian.klp slovak2.klp slovak.klp slovenian2.klp slovenian.klp spanish.klp \ + swahili.klp tagalog.klp tamil.klp thai.klp turkish.klp ukrainian.klp \ + vietnamese.klp welsh.klp + +#>- all: all-am +#>+ 1 +all: docs-am all-am + +.SUFFIXES: +$(srcdir)/Makefile.in: $(srcdir)/Makefile.am $(am__configure_deps) +#>- @for dep in $?; do \ +#>- case '$(am__configure_deps)' in \ +#>- *$$dep*) \ +#>- cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh \ +#>- && exit 0; \ +#>- exit 1;; \ +#>- esac; \ +#>- done; \ +#>- echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu kat/src/language/Makefile'; \ +#>- cd $(top_srcdir) && \ +#>- $(AUTOMAKE) --gnu kat/src/language/Makefile +#>+ 12 + @for dep in $?; do \ + case '$(am__configure_deps)' in \ + *$$dep*) \ + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh \ + && exit 0; \ + exit 1;; \ + esac; \ + done; \ + echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu kat/src/language/Makefile'; \ + cd $(top_srcdir) && \ + $(AUTOMAKE) --gnu kat/src/language/Makefile + cd $(top_srcdir) && perl admin/am_edit kat/src/language/Makefile.in +.PRECIOUS: Makefile +Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status + @case '$?' in \ + *config.status*) \ + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh;; \ + *) \ + echo ' cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe)'; \ + cd $(top_builddir) && $(SHELL) ./config.status $(subdir)/$@ $(am__depfiles_maybe);; \ + esac; + +$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES) + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh + +$(top_srcdir)/configure: $(am__configure_deps) + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh +$(ACLOCAL_M4): $(am__aclocal_m4_deps) + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh + +mostlyclean-libtool: + -rm -f *.lo + +clean-libtool: + -rm -rf .libs _libs + +distclean-libtool: + -rm -f libtool +uninstall-info-am: +install-languageDATA: $(language_DATA) + @$(NORMAL_INSTALL) + test -z "$(languagedir)" || $(mkdir_p) "$(DESTDIR)$(languagedir)" + @list='$(language_DATA)'; for p in $$list; do \ + if test -f "$$p"; then d=; else d="$(srcdir)/"; fi; \ + f=$(am__strip_dir) \ + echo " $(languageDATA_INSTALL) '$$d$$p' '$(DESTDIR)$(languagedir)/$$f'"; \ + $(languageDATA_INSTALL) "$$d$$p" "$(DESTDIR)$(languagedir)/$$f"; \ + done + +uninstall-languageDATA: + @$(NORMAL_UNINSTALL) + @list='$(language_DATA)'; for p in $$list; do \ + f=$(am__strip_dir) \ + echo " rm -f '$(DESTDIR)$(languagedir)/$$f'"; \ + rm -f "$(DESTDIR)$(languagedir)/$$f"; \ + done +tags: TAGS +TAGS: + +ctags: CTAGS +CTAGS: + + +distdir: $(DISTFILES) + @srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`; \ + topsrcdirstrip=`echo "$(top_srcdir)" | sed 's|.|.|g'`; \ + list='$(DISTFILES)'; for file in $$list; do \ + case $$file in \ + $(srcdir)/*) file=`echo "$$file" | sed "s|^$$srcdirstrip/||"`;; \ + $(top_srcdir)/*) file=`echo "$$file" | sed "s|^$$topsrcdirstrip/|$(top_builddir)/|"`;; \ + esac; \ + if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \ + dir=`echo "$$file" | sed -e 's,/[^/]*$$,,'`; \ + if test "$$dir" != "$$file" && test "$$dir" != "."; then \ + dir="/$$dir"; \ + $(mkdir_p) "$(distdir)$$dir"; \ + else \ + dir=''; \ + fi; \ + if test -d $$d/$$file; then \ + if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \ + cp -pR $(srcdir)/$$file $(distdir)$$dir || exit 1; \ + fi; \ + cp -pR $$d/$$file $(distdir)$$dir || exit 1; \ + else \ + test -f $(distdir)/$$file \ + || cp -p $$d/$$file $(distdir)/$$file \ + || exit 1; \ + fi; \ + done +check-am: all-am +check: check-am +all-am: Makefile $(DATA) +installdirs: + for dir in "$(DESTDIR)$(languagedir)"; do \ + test -z "$$dir" || $(mkdir_p) "$$dir"; \ + done +install: install-am +install-exec: install-exec-am +install-data: install-data-am +uninstall: uninstall-am + +install-am: all-am + @$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am + +installcheck: installcheck-am +install-strip: + $(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \ + install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \ + `test -z '$(STRIP)' || \ + echo "INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'"` install +mostlyclean-generic: + +clean-generic: + +distclean-generic: + -test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES) + +maintainer-clean-generic: + @echo "This command is intended for maintainers to use" + @echo "it deletes files that may require special tools to rebuild." +#>- clean: clean-am +#>+ 1 +clean: kde-rpo-clean clean-am + +#>- clean-am: clean-generic clean-libtool mostlyclean-am +#>+ 1 +clean-am: clean-bcheck clean-generic clean-libtool mostlyclean-am + +distclean: distclean-am + -rm -f Makefile +distclean-am: clean-am distclean-generic distclean-libtool + +dvi: dvi-am + +dvi-am: + +html: html-am + +info: info-am + +info-am: + +install-data-am: install-languageDATA + +install-exec-am: + +install-info: install-info-am + +install-man: + +installcheck-am: + +maintainer-clean: maintainer-clean-am + -rm -f Makefile +maintainer-clean-am: distclean-am maintainer-clean-generic + +mostlyclean: mostlyclean-am + +mostlyclean-am: mostlyclean-generic mostlyclean-libtool + +pdf: pdf-am + +pdf-am: + +ps: ps-am + +ps-am: + +uninstall-am: uninstall-info-am uninstall-languageDATA + +.PHONY: all all-am check check-am clean clean-generic clean-libtool \ + distclean distclean-generic distclean-libtool distdir dvi \ + dvi-am html html-am info info-am install install-am \ + install-data install-data-am install-exec install-exec-am \ + install-info install-info-am install-languageDATA install-man \ + install-strip installcheck installcheck-am installdirs \ + maintainer-clean maintainer-clean-generic mostlyclean \ + mostlyclean-generic mostlyclean-libtool pdf pdf-am ps ps-am \ + uninstall uninstall-am uninstall-info-am \ + uninstall-languageDATA + +# Tell versions [3.59,3.63) of GNU make to not export all variables. +# Otherwise a system limit (for SysV at least) may be exceeded. +.NOEXPORT: + +#>+ 2 +KDE_DIST=czech.klp ukrainian.klp rumantsch.klp latvian.klp chinese2.klp scots.klp tagalog.klp manx.klp slovak2.klp spanish.klp malay.klp latin.klp icelandic.klp welsh.klp finnish.klp indonesian.klp hebrew.klp hawaian.klp japanese-shift_jis.klp irish.klp bosnian.klp russian2.klp albanian.klp nepali.klp hindi.klp serbian.klp tamil.klp swahili.klp portuguese.klp georgian.klp catalan.klp turkish.klp hungarian.klp sanskrit.klp mf.klp dutch.klp belarus.klp korean.klp slovak.klp chinese.klp vietnamese.klp english.klp german.klp frisian.klp greek.klp scots_gaelic.klp slovenian2.klp breton.klp thai.klp danish.klp esperanto.klp middle-frisian.klp slovenian.klp arabic2.klp persian.klp armenian.klp norwegian.klp quechua.klp russian.klp basque.klp mingo.klp chinese1.klp japanese-euc_jp.klp french.klp Makefile.in lithuanian.klp croatian.klp romanian.klp russian1.klp marathi.klp afrikaans.klp bulgarian.klp Makefile.am arabic.klp italian.klp estonian.klp polish.klp + +#>+ 2 +docs-am: + +#>+ 15 +force-reedit: + @for dep in $?; do \ + case '$(am__configure_deps)' in \ + *$$dep*) \ + cd $(top_builddir) && $(MAKE) $(AM_MAKEFLAGS) am--refresh \ + && exit 0; \ + exit 1;; \ + esac; \ + done; \ + echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu kat/src/language/Makefile'; \ + cd $(top_srcdir) && \ + $(AUTOMAKE) --gnu kat/src/language/Makefile + cd $(top_srcdir) && perl admin/am_edit kat/src/language/Makefile.in + + +#>+ 21 +clean-bcheck: + rm -f *.bchecktest.cc *.bchecktest.cc.class a.out + +bcheck: bcheck-am + +bcheck-am: + @for i in ; do \ + if test $(srcdir)/$$i -nt $$i.bchecktest.cc; then \ + echo "int main() {return 0;}" > $$i.bchecktest.cc ; \ + echo "#include \"$$i\"" >> $$i.bchecktest.cc ; \ + echo "$$i"; \ + if ! $(CXX) $(DEFS) -I. -I$(srcdir) -I$(top_builddir) $(INCLUDES) $(AM_CPPFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(KDE_CXXFLAGS) --dump-class-hierarchy -c $$i.bchecktest.cc; then \ + rm -f $$i.bchecktest.cc; exit 1; \ + fi ; \ + echo "" >> $$i.bchecktest.cc.class; \ + perl $(top_srcdir)/admin/bcheck.pl $$i.bchecktest.cc.class || { rm -f $$i.bchecktest.cc; exit 1; }; \ + rm -f a.out; \ + fi ; \ + done + + +#>+ 3 +final: + $(MAKE) all-am + +#>+ 3 +final-install: + $(MAKE) install-am + +#>+ 3 +no-final: + $(MAKE) all-am + +#>+ 3 +no-final-install: + $(MAKE) install-am + +#>+ 3 +kde-rpo-clean: + -rm -f *.rpo + +#>+ 3 +nmcheck: +nmcheck-am: nmcheck diff --git a/src/plugins/language/afrikaans.klp b/src/plugins/language/afrikaans.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="884" value="_" /> + <ngram occurrences="619" value="e" /> + <ngram occurrences="335" value="a" /> + <ngram occurrences="311" value="n" /> + <ngram occurrences="283" value="i" /> + <ngram occurrences="236" value="o" /> + <ngram occurrences="228" value="r" /> + <ngram occurrences="213" value="s" /> + <ngram occurrences="208" value="t" /> + <ngram occurrences="198" value="d" /> + <ngram occurrences="182" value="e_" /> + <ngram occurrences="132" value="m" /> + <ngram occurrences="127" value="l" /> + <ngram occurrences="126" value="g" /> + <ngram occurrences="125" value="k" /> + <ngram occurrences="124" value="n_" /> + <ngram occurrences="123" value="ie" /> + <ngram occurrences="106" value="t_" /> + <ngram occurrences="105" value="h" /> + <ngram occurrences="98" value="ie_" /> + <ngram occurrences="95" value="_h" /> + <ngram occurrences="89" value="_d" /> + <ngram occurrences="85" value="s_" /> + <ngram occurrences="85" value="er" /> + <ngram occurrences="83" value="y" /> + <ngram occurrences="83" value="v" /> + <ngram occurrences="83" value="an" /> + <ngram occurrences="78" value="w" /> + <ngram occurrences="76" value="r_" /> + <ngram occurrences="75" value="di" /> + <ngram occurrences="75" value="aa" /> + <ngram occurrences="73" value="_n" /> + <ngram occurrences="72" value="_v" /> + <ngram occurrences="71" value="_s" /> + <ngram occurrences="68" value="en" /> + <ngram occurrences="65" value="y_" /> + <ngram occurrences="64" value="_m" /> + <ngram occurrences="64" value="_di" /> + <ngram occurrences="60" value="ge" /> + <ngram occurrences="59" value="u" /> + <ngram occurrences="55" value="b" /> + <ngram occurrences="54" value="et" /> + <ngram occurrences="54" value="_w" /> + <ngram occurrences="54" value="_e" /> + <ngram occurrences="52" value="die" /> + <ngram occurrences="50" value="et_" /> + <ngram occurrences="50" value="die_" /> + <ngram occurrences="49" value="_o" /> + <ngram occurrences="49" value="_die" /> + <ngram occurrences="48" value="te" /> + <ngram occurrences="48" value="in" /> + <ngram occurrences="48" value="_die_" /> + <ngram occurrences="47" value="ni" /> + <ngram occurrences="47" value="ee" /> + <ngram occurrences="46" value="k_" /> + <ngram occurrences="46" value="an_" /> + <ngram occurrences="44" value="p" /> + <ngram occurrences="42" value="de" /> + <ngram occurrences="42" value="_a" /> + <ngram occurrences="41" value="_g" /> + <ngram occurrences="39" value="g_" /> + <ngram occurrences="39" value="d_" /> + <ngram occurrences="38" value="er_" /> + <ngram occurrences="37" value="en_" /> + <ngram occurrences="36" value="nd" /> + <ngram occurrences="36" value="ar" /> + <ngram occurrences="35" value="wa" /> + <ngram occurrences="35" value="nie" /> + <ngram occurrences="35" value="he" /> + <ngram occurrences="35" value="el" /> + <ngram occurrences="35" value="at" /> + <ngram occurrences="35" value="_i" /> + <ngram occurrences="34" value="oo" /> + <ngram occurrences="34" value="oe" /> + <ngram occurrences="34" value="nie_" /> + <ngram occurrences="34" value="_ni" /> + <ngram occurrences="33" value="m_" /> + <ngram occurrences="33" value="ek" /> + <ngram occurrences="33" value="_wa" /> + <ngram occurrences="33" value="_nie_" /> + <ngram occurrences="33" value="_nie" /> + <ngram occurrences="33" value="_he" /> + <ngram occurrences="32" value="_b" /> + <ngram occurrences="31" value="_en" /> + <ngram occurrences="30" value="_k" /> + <ngram occurrences="30" value="_ge" /> + <ngram occurrences="29" value="om" /> + <ngram occurrences="29" value="me" /> + <ngram occurrences="29" value="ma" /> + <ngram occurrences="29" value="_t" /> + <ngram occurrences="28" value="va" /> + <ngram occurrences="28" value="l_" /> + <ngram occurrences="28" value="aan" /> + <ngram occurrences="27" value="is" /> + <ngram occurrences="27" value="at_" /> + <ngram occurrences="26" value="on" /> + <ngram occurrences="26" value="hy_" /> + <ngram occurrences="26" value="hy" /> + <ngram occurrences="26" value="f" /> + <ngram occurrences="26" value="_hy_" /> + <ngram occurrences="26" value="_hy" /> + <ngram occurrences="25" value="or" /> + <ngram occurrences="25" value="n_d" /> + <ngram occurrences="25" value="_en_" /> + <ngram occurrences="24" value="it" /> + <ngram occurrences="24" value="het_" /> + <ngram occurrences="24" value="het" /> + <ngram occurrences="24" value="es" /> + <ngram occurrences="24" value="as" /> + <ngram occurrences="24" value="aar" /> + <ngram occurrences="24" value="_het_" /> + <ngram occurrences="24" value="_het" /> + <ngram occurrences="23" value="van" /> + <ngram occurrences="23" value="te_" /> + <ngram occurrences="23" value="om_" /> + <ngram occurrences="23" value="e_m" /> + <ngram occurrences="23" value="da" /> + <ngram occurrences="22" value="ra" /> + <ngram occurrences="22" value="ou" /> + <ngram occurrences="22" value="li" /> + <ngram occurrences="22" value="_ma" /> + <ngram occurrences="21" value="ek_" /> + <ngram occurrences="21" value="be" /> + <ngram occurrences="21" value="al" /> + <ngram occurrences="21" value="_va" /> + <ngram occurrences="20" value="sy_" /> + <ngram occurrences="20" value="sy" /> + <ngram occurrences="20" value="rd" /> + <ngram occurrences="20" value="ng" /> + <ngram occurrences="20" value="as_" /> + <ngram occurrences="20" value="_sy_" /> + <ngram occurrences="20" value="_sy" /> + <ngram occurrences="19" value="we" /> + <ngram occurrences="19" value="st" /> + <ngram occurrences="19" value="ke" /> + <ngram occurrences="19" value="is_" /> + <ngram occurrences="19" value="ar_" /> + <ngram occurrences="19" value="aar_" /> + <ngram occurrences="19" value="_van" /> + <ngram occurrences="18" value="van_" /> + <ngram occurrences="18" value="se" /> + <ngram occurrences="18" value="n_di" /> + <ngram occurrences="18" value="it_" /> + <ngram occurrences="18" value="in_" /> + <ngram occurrences="18" value="ag" /> + <ngram occurrences="18" value="_me" /> + <ngram occurrences="17" value="ro" /> + <ngram occurrences="17" value="re" /> + <ngram occurrences="17" value="le" /> + <ngram occurrences="17" value="ho" /> + <ngram occurrences="17" value="ei" /> + <ngram occurrences="17" value="der" /> + <ngram occurrences="17" value="and" /> + <ngram occurrences="17" value="aan_" /> + <ngram occurrences="17" value="_van_" /> + <ngram occurrences="17" value="_in" /> + <ngram occurrences="16" value="u_" /> + <ngram occurrences="16" value="ou_" /> + <ngram occurrences="16" value="nde" /> + <ngram occurrences="16" value="ko" /> + <ngram occurrences="16" value="ie_m" /> + <ngram occurrences="16" value="e_s" /> + <ngram occurrences="16" value="e_h" /> + <ngram occurrences="16" value="_be" /> + <ngram occurrences="15" value="so" /> + <ngram occurrences="15" value="rs" /> + <ngram occurrences="15" value="op" /> + <ngram occurrences="15" value="ns" /> + <ngram occurrences="15" value="mo" /> + <ngram occurrences="15" value="maa" /> + <ngram occurrences="15" value="ik" /> + <ngram occurrences="15" value="ig" /> + <ngram occurrences="15" value="em" /> + <ngram occurrences="15" value="e_v" /> + <ngram occurrences="15" value="_te" /> + <ngram occurrences="15" value="_n_" /> + <ngram occurrences="14" value="vo" /> + <ngram occurrences="14" value="vi" /> + <ngram occurrences="14" value="ve" /> + <ngram occurrences="14" value="t_d" /> + <ngram occurrences="14" value="si" /> + <ngram occurrences="14" value="nt" /> + <ngram occurrences="14" value="n_die" /> + <ngram occurrences="14" value="ha" /> + <ngram occurrences="14" value="_vi" /> + <ngram occurrences="14" value="_te_" /> + <ngram occurrences="14" value="_mo" /> + <ngram occurrences="14" value="_is_" /> + <ngram occurrences="14" value="_is" /> + <ngram occurrences="14" value="_in_" /> + <ngram occurrences="14" value="_ek_" /> + <ngram occurrences="14" value="_ek" /> + <ngram occurrences="14" value="_da" /> + <ngram occurrences="13" value="wo" /> + <ngram occurrences="13" value="wat" /> + <ngram occurrences="13" value="t_di" /> + <ngram occurrences="13" value="rt" /> + <ngram occurrences="13" value="r_h" /> + <ngram occurrences="13" value="no" /> + <ngram occurrences="13" value="j" /> + <ngram occurrences="13" value="eer" /> + <ngram occurrences="13" value="e_o" /> + <ngram occurrences="13" value="ag_" /> + <ngram occurrences="13" value="_wat" /> + <ngram occurrences="13" value="_vo" /> + <ngram occurrences="13" value="_ve" /> + <ngram occurrences="13" value="_p" /> + <ngram occurrences="13" value="_on" /> + <ngram occurrences="13" value="_maa" /> + <ngram occurrences="13" value="_ha" /> + <ngram occurrences="12" value="wat_" /> + <ngram occurrences="12" value="was_" /> + <ngram occurrences="12" value="was" /> + <ngram occurrences="12" value="ver" /> + <ngram occurrences="12" value="t_die" /> + <ngram occurrences="12" value="sk" /> + <ngram occurrences="12" value="s_h" /> + <ngram occurrences="12" value="p_" /> + <ngram occurrences="12" value="ne" /> + <ngram occurrences="12" value="n_s" /> + <ngram occurrences="12" value="n_k" /> + <ngram occurrences="12" value="moe" /> + <ngram occurrences="12" value="ing" /> + <ngram occurrences="12" value="f_" /> + <ngram occurrences="12" value="el_" /> + <ngram occurrences="12" value="e_g" /> + <ngram occurrences="12" value="e_d" /> + <ngram occurrences="12" value="bl" /> + <ngram occurrences="12" value="al_" /> + <ngram occurrences="12" value="_wat_" /> + <ngram occurrences="12" value="_was_" /> + <ngram occurrences="12" value="_was" /> + <ngram occurrences="12" value="_so" /> + <ngram occurrences="12" value="_om_" /> + <ngram occurrences="12" value="_om" /> + <ngram occurrences="12" value="_ko" /> + <ngram occurrences="12" value="_aan" /> + <ngram occurrences="12" value="_aa" /> + <ngram occurrences="11" value="vr" /> + <ngram occurrences="11" value="vir_" /> + <ngram occurrences="11" value="vir" /> + <ngram occurrences="11" value="to" /> + <ngram occurrences="11" value="ta" /> + <ngram occurrences="11" value="t_h" /> + <ngram occurrences="11" value="s_v" /> + <ngram occurrences="11" value="rd_" /> + <ngram occurrences="11" value="ord" /> + <ngram occurrences="11" value="op_" /> + <ngram occurrences="11" value="oor" /> + <ngram occurrences="11" value="n_n" /> + <ngram occurrences="11" value="met" /> + <ngram occurrences="11" value="maar_" /> + <ngram occurrences="11" value="maar" /> + <ngram occurrences="11" value="ka" /> + <ngram occurrences="11" value="ir_" /> + <ngram occurrences="11" value="ir" /> + <ngram occurrences="11" value="ie_s" /> + <ngram occurrences="11" value="ew" /> + <ngram occurrences="11" value="ers" /> + <ngram occurrences="11" value="ed" /> + <ngram occurrences="11" value="de_" /> + <ngram occurrences="11" value="_vir_" /> + <ngram occurrences="11" value="_vir" /> + <ngram occurrences="11" value="_ver" /> + <ngram occurrences="11" value="_no" /> + <ngram occurrences="11" value="_moe" /> + <ngram occurrences="11" value="_maar" /> + <ngram occurrences="11" value="_ho" /> + <ngram occurrences="11" value="_al" /> + <ngram occurrences="10" value="ui" /> + <ngram occurrences="10" value="t_n" /> + <ngram occurrences="10" value="sta" /> + <ngram occurrences="10" value="sie" /> + <ngram occurrences="10" value="ri" /> + <ngram occurrences="10" value="raa" /> + <ngram occurrences="10" value="nge" /> + <ngram occurrences="10" value="nder" /> + <ngram occurrences="10" value="nd_" /> + <ngram occurrences="10" value="n_m" /> + <ngram occurrences="10" value="met_" /> + <ngram occurrences="10" value="man" /> + <ngram occurrences="10" value="lik" /> + <ngram occurrences="10" value="en_d" /> + <ngram occurrences="10" value="e_w" /> + <ngram occurrences="10" value="e_n" /> + <ngram occurrences="10" value="_vr" /> + <ngram occurrences="10" value="_se" /> + <ngram occurrences="10" value="_op" /> + <ngram occurrences="10" value="_met_" /> + <ngram occurrences="10" value="_met" /> + <ngram occurrences="10" value="_j" /> + <ngram occurrences="9" value="t_v" /> + <ngram occurrences="9" value="t_nie" /> + <ngram occurrences="9" value="t_ni" /> + <ngram occurrences="9" value="s_i" /> + <ngram occurrences="9" value="rs_" /> + <ngram occurrences="9" value="pr" /> + <ngram occurrences="9" value="ord_" /> + <ngram occurrences="9" value="og" /> + <ngram occurrences="9" value="nk" /> + <ngram occurrences="9" value="n_w" /> + <ngram occurrences="9" value="ll" /> + <ngram occurrences="9" value="ke_" /> + <ngram occurrences="9" value="ig_" /> + <ngram occurrences="9" value="ges" /> + <ngram occurrences="9" value="es_" /> + <ngram occurrences="9" value="eer_" /> + <ngram occurrences="9" value="a_" /> + <ngram occurrences="9" value="_to" /> + <ngram occurrences="9" value="_r" /> + <ngram occurrences="9" value="_l" /> + <ngram occurrences="8" value="word_" /> + <ngram occurrences="8" value="word" /> + <ngram occurrences="8" value="wor" /> + <ngram occurrences="8" value="taa" /> + <ngram occurrences="8" value="t_m" /> + <ngram occurrences="8" value="t_e" /> + <ngram occurrences="8" value="rte" /> + <ngram occurrences="8" value="r_s" /> + <ngram occurrences="8" value="r_n" /> + <ngram occurrences="8" value="r_e" /> + <ngram occurrences="8" value="r_d" /> + <ngram occurrences="8" value="pa" /> + <ngram occurrences="8" value="og_" /> + <ngram occurrences="8" value="oe_" /> + <ngram occurrences="8" value="ng_" /> + <ngram occurrences="8" value="na" /> + <ngram occurrences="8" value="n_h" /> + <ngram occurrences="8" value="my_" /> + <ngram occurrences="8" value="my" /> + <ngram occurrences="8" value="la" /> + <ngram occurrences="8" value="kl" /> + <ngram occurrences="8" value="k_h" /> + <ngram occurrences="8" value="ie_ma" /> + <ngram occurrences="8" value="hi" /> + <ngram occurrences="8" value="ge_" /> + <ngram occurrences="8" value="ga" /> + <ngram occurrences="8" value="ewe" /> + <ngram occurrences="8" value="eu" /> + <ngram occurrences="8" value="ers_" /> + <ngram occurrences="8" value="eg" /> + <ngram occurrences="8" value="een" /> + <ngram occurrences="8" value="e_ma" /> + <ngram occurrences="8" value="e_he" /> + <ngram occurrences="8" value="e_a" /> + <ngram occurrences="8" value="dit_" /> + <ngram occurrences="8" value="dit" /> + <ngram occurrences="8" value="din" /> + <ngram occurrences="8" value="die_m" /> + <ngram occurrences="8" value="ak" /> + <ngram occurrences="8" value="aat" /> + <ngram occurrences="8" value="_sk" /> + <ngram occurrences="8" value="_pr" /> + <ngram occurrences="8" value="_ne" /> + <ngram occurrences="8" value="_my_" /> + <ngram occurrences="8" value="_my" /> + <ngram occurrences="8" value="_hi" /> + <ngram occurrences="8" value="_dit_" /> + <ngram occurrences="8" value="_dit" /> + <ngram occurrences="7" value="wee" /> + <ngram occurrences="7" value="ur" /> + <ngram occurrences="7" value="uit" /> + <ngram occurrences="7" value="toe_" /> + <ngram occurrences="7" value="toe" /> + <ngram occurrences="7" value="tee" /> + <ngram occurrences="7" value="t_s" /> + <ngram occurrences="7" value="ste" /> + <ngram occurrences="7" value="staa" /> + <ngram occurrences="7" value="s_n" /> + <ngram occurrences="7" value="s_m" /> + <ngram occurrences="7" value="s_in" /> + <ngram occurrences="7" value="s_hy_" /> + <ngram occurrences="7" value="s_hy" /> + <ngram occurrences="7" value="s_d" /> + <ngram occurrences="7" value="oet_" /> + <ngram occurrences="7" value="oet" /> + <ngram occurrences="7" value="ns_" /> + <ngram occurrences="7" value="nda" /> + <ngram occurrences="7" value="n_v" /> + <ngram occurrences="7" value="n_e" /> + <ngram occurrences="7" value="lin" /> + <ngram occurrences="7" value="le_" /> + <ngram occurrences="7" value="ind" /> + <ngram occurrences="7" value="ik_" /> + <ngram occurrences="7" value="ier" /> + <ngram occurrences="7" value="ie_h" /> + <ngram occurrences="7" value="id" /> + <ngram occurrences="7" value="ger" /> + <ngram occurrences="7" value="gaan_" /> + <ngram occurrences="7" value="gaan" /> + <ngram occurrences="7" value="gaa" /> + <ngram occurrences="7" value="et_m" /> + <ngram occurrences="7" value="et_d" /> + <ngram occurrences="7" value="erd" /> + <ngram occurrences="7" value="end" /> + <ngram occurrences="7" value="e_vo" /> + <ngram occurrences="7" value="e_p" /> + <ngram occurrences="7" value="e_moe" /> + <ngram occurrences="7" value="e_mo" /> + <ngram occurrences="7" value="e_me" /> +</ngrams> diff --git a/src/plugins/language/albanian.klp b/src/plugins/language/albanian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="915" value="_" /> + <ngram occurrences="383" value="ë" /> + <ngram occurrences="378" value="e" /> + <ngram occurrences="356" value="t" /> + <ngram occurrences="308" value="i" /> + <ngram occurrences="279" value="r" /> + <ngram occurrences="267" value="a" /> + <ngram occurrences="244" value="n" /> + <ngram occurrences="225" value="s" /> + <ngram occurrences="214" value="ë_" /> + <ngram occurrences="187" value="h" /> + <ngram occurrences="182" value="e_" /> + <ngram occurrences="158" value="j" /> + <ngram occurrences="131" value="u" /> + <ngram occurrences="131" value="k" /> + <ngram occurrences="127" value="m" /> + <ngram occurrences="123" value="o" /> + <ngram occurrences="119" value="të" /> + <ngram occurrences="119" value="p" /> + <ngram occurrences="115" value="d" /> + <ngram occurrences="112" value="_t" /> + <ngram occurrences="98" value="të_" /> + <ngram occurrences="93" value="_n" /> + <ngram occurrences="89" value="sh" /> + <ngram occurrences="89" value="l" /> + <ngram occurrences="87" value="_p" /> + <ngram occurrences="84" value="_s" /> + <ngram occurrences="83" value="a_" /> + <ngram occurrences="78" value="i_" /> + <ngram occurrences="75" value="ër" /> + <ngram occurrences="74" value="te" /> + <ngram occurrences="71" value="_k" /> + <ngram occurrences="70" value="_m" /> + <ngram occurrences="67" value="g" /> + <ngram occurrences="64" value="r_" /> + <ngram occurrences="63" value="_të_" /> + <ngram occurrences="63" value="_të" /> + <ngram occurrences="54" value="te_" /> + <ngram occurrences="54" value="ht" /> + <ngram occurrences="52" value="t_" /> + <ngram occurrences="52" value="sht" /> + <ngram occurrences="52" value="_e" /> + <ngram occurrences="49" value="is" /> + <ngram occurrences="49" value="_e_" /> + <ngram occurrences="47" value="ri" /> + <ngram occurrences="47" value="n_" /> + <ngram occurrences="46" value="nd" /> + <ngram occurrences="45" value="v" /> + <ngram occurrences="45" value="he" /> + <ngram occurrences="45" value="_a" /> + <ngram occurrences="43" value="et" /> + <ngram occurrences="42" value="pë" /> + <ngram occurrences="41" value="q" /> + <ngram occurrences="41" value="për" /> + <ngram occurrences="41" value="me" /> + <ngram occurrences="41" value="b" /> + <ngram occurrences="41" value="_d" /> + <ngram occurrences="39" value="ish" /> + <ngram occurrences="38" value="_i" /> + <ngram occurrences="37" value="it" /> + <ngram occurrences="36" value="në" /> + <ngram occurrences="36" value="j_" /> + <ngram occurrences="35" value="ur" /> + <ngram occurrences="35" value="ar" /> + <ngram occurrences="34" value="in" /> + <ngram occurrences="34" value="_për" /> + <ngram occurrences="34" value="_pë" /> + <ngram occurrences="33" value="s_" /> + <ngram occurrences="33" value="en" /> + <ngram occurrences="32" value="rë" /> + <ngram occurrences="32" value="o_" /> + <ngram occurrences="32" value="isht" /> + <ngram occurrences="31" value="hte" /> + <ngram occurrences="31" value="_v" /> + <ngram occurrences="30" value="ë_t" /> + <ngram occurrences="30" value="z" /> + <ngram occurrences="30" value="shte" /> + <ngram occurrences="30" value="je" /> + <ngram occurrences="29" value="në_" /> + <ngram occurrences="29" value="f" /> + <ngram occurrences="29" value="dh" /> + <ngram occurrences="29" value="_me" /> + <ngram occurrences="28" value="jë" /> + <ngram occurrences="28" value="gj" /> + <ngram occurrences="28" value="ej" /> + <ngram occurrences="28" value="_b" /> + <ngram occurrences="27" value="ës" /> + <ngram occurrences="27" value="nj" /> + <ngram occurrences="27" value="at" /> + <ngram occurrences="26" value="u_" /> + <ngram occurrences="26" value="hte_" /> + <ngram occurrences="25" value="shte_" /> + <ngram occurrences="25" value="mi" /> + <ngram occurrences="25" value="er" /> + <ngram occurrences="24" value="ër_" /> + <ngram occurrences="24" value="ë_p" /> + <ngram occurrences="24" value="si" /> + <ngram occurrences="24" value="re" /> + <ngram occurrences="24" value="ra" /> + <ngram occurrences="24" value="ishte" /> + <ngram occurrences="24" value="in_" /> + <ngram occurrences="24" value="ej_" /> + <ngram occurrences="24" value="_sh" /> + <ngram occurrences="24" value="_në" /> + <ngram occurrences="23" value="ën" /> + <ngram occurrences="23" value="ti" /> + <ngram occurrences="23" value="kë" /> + <ngram occurrences="23" value="ku" /> + <ngram occurrences="23" value="_g" /> + <ngram occurrences="22" value="ta" /> + <ngram occurrences="22" value="pa" /> + <ngram occurrences="22" value="on" /> + <ngram occurrences="22" value="një" /> + <ngram occurrences="22" value="ni" /> + <ngram occurrences="22" value="me_" /> + <ngram occurrences="22" value="jë_" /> + <ngram occurrences="22" value="_q" /> + <ngram occurrences="21" value="ur_" /> + <ngram occurrences="21" value="th" /> + <ngram occurrences="21" value="se" /> + <ngram occurrences="21" value="es" /> + <ngram occurrences="21" value="e_t" /> + <ngram occurrences="21" value="e_m" /> + <ngram occurrences="21" value="do" /> + <ngram occurrences="21" value="as" /> + <ngram occurrences="21" value="_si" /> + <ngram occurrences="21" value="_në_" /> + <ngram occurrences="20" value="y" /> + <ngram occurrences="20" value="ve" /> + <ngram occurrences="20" value="ng" /> + <ngram occurrences="20" value="e_n" /> + <ngram occurrences="20" value="an" /> + <ngram occurrences="20" value="_pa" /> + <ngram occurrences="19" value="ë_k" /> + <ngram occurrences="19" value="ç" /> + <ngram occurrences="19" value="se_" /> + <ngram occurrences="19" value="po" /> + <ngram occurrences="19" value="ki" /> + <ngram occurrences="19" value="im" /> + <ngram occurrences="19" value="_i_" /> + <ngram occurrences="18" value="ë_n" /> + <ngram occurrences="18" value="nt" /> + <ngram occurrences="18" value="më" /> + <ngram occurrences="18" value="ll" /> + <ngram occurrences="18" value="ja" /> + <ngram occurrences="18" value="aj" /> + <ngram occurrences="18" value="_nj" /> + <ngram occurrences="18" value="_nd" /> + <ngram occurrences="18" value="_me_" /> + <ngram occurrences="18" value="_l" /> + <ngram occurrences="18" value="_f" /> + <ngram occurrences="17" value="ës_" /> + <ngram occurrences="17" value="ë_s" /> + <ngram occurrences="17" value="rë_" /> + <ngram occurrences="17" value="që" /> + <ngram occurrences="17" value="një_" /> + <ngram occurrences="17" value="it_" /> + <ngram occurrences="17" value="il" /> + <ngram occurrences="17" value="ik" /> + <ngram occurrences="17" value="e_s" /> + <ngram occurrences="16" value="ët" /> + <ngram occurrences="16" value="ë_m" /> + <ngram occurrences="16" value="të_t" /> + <ngram occurrences="16" value="që_" /> + <ngram occurrences="16" value="për_" /> + <ngram occurrences="16" value="or" /> + <ngram occurrences="16" value="ka" /> + <ngram occurrences="16" value="he_" /> + <ngram occurrences="16" value="etë" /> + <ngram occurrences="16" value="e_k" /> + <ngram occurrences="16" value="dhe" /> + <ngram occurrences="16" value="_ve" /> + <ngram occurrences="16" value="_një" /> + <ngram occurrences="16" value="_ng" /> + <ngram occurrences="16" value="_ki" /> + <ngram occurrences="16" value="_gj" /> + <ngram occurrences="15" value="ën_" /> + <ngram occurrences="15" value="ua" /> + <ngram occurrences="15" value="tu" /> + <ngram occurrences="15" value="rr" /> + <ngram occurrences="15" value="kis" /> + <ngram occurrences="15" value="ha" /> + <ngram occurrences="15" value="dhe_" /> + <ngram occurrences="15" value="_h" /> + <ngram occurrences="14" value="ë_a" /> + <ngram occurrences="14" value="së" /> + <ngram occurrences="14" value="pr" /> + <ngram occurrences="14" value="oh" /> + <ngram occurrences="14" value="kish" /> + <ngram occurrences="14" value="k_" /> + <ngram occurrences="14" value="ga" /> + <ngram occurrences="14" value="end" /> + <ngram occurrences="14" value="e_të_" /> + <ngram occurrences="14" value="e_të" /> + <ngram occurrences="14" value="di" /> + <ngram occurrences="14" value="c" /> + <ngram occurrences="14" value="_që_" /> + <ngram occurrences="14" value="_që" /> + <ngram occurrences="14" value="_kë" /> + <ngram occurrences="14" value="_kish" /> + <ngram occurrences="14" value="_kis" /> + <ngram occurrences="14" value="_ish" /> + <ngram occurrences="14" value="_is" /> + <ngram occurrences="13" value="un" /> + <ngram occurrences="13" value="nte_" /> + <ngram occurrences="13" value="nte" /> + <ngram occurrences="13" value="nga" /> + <ngram occurrences="13" value="më_" /> + <ngram occurrences="13" value="li" /> + <ngram occurrences="13" value="ko" /> + <ngram occurrences="13" value="ji" /> + <ngram occurrences="13" value="i_n" /> + <ngram occurrences="13" value="hi" /> + <ngram occurrences="13" value="hej_" /> + <ngram occurrences="13" value="hej" /> + <ngram occurrences="13" value="atë" /> + <ngram occurrences="13" value="_nga" /> + <ngram occurrences="13" value="_ku" /> + <ngram occurrences="13" value="_isht" /> + <ngram occurrences="13" value="_dh" /> + <ngram occurrences="12" value="ë_të_" /> + <ngram occurrences="12" value="ë_të" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="ri_" /> + <ngram occurrences="12" value="kur" /> + <ngram occurrences="12" value="jo_" /> + <ngram occurrences="12" value="jo" /> + <ngram occurrences="12" value="_u" /> + <ngram occurrences="12" value="_një_" /> + <ngram occurrences="12" value="_më" /> + <ngram occurrences="12" value="_dhe_" /> + <ngram occurrences="12" value="_dhe" /> + <ngram occurrences="11" value="uk" /> + <ngram occurrences="11" value="të_p" /> + <ngram occurrences="11" value="ta_" /> + <ngram occurrences="11" value="shi" /> + <ngram occurrences="11" value="sa" /> + <ngram occurrences="11" value="rt" /> + <ngram occurrences="11" value="r_t" /> + <ngram occurrences="11" value="ni_" /> + <ngram occurrences="11" value="nd_" /> + <ngram occurrences="11" value="n_e_" /> + <ngram occurrences="11" value="n_e" /> + <ngram occurrences="11" value="m_" /> + <ngram occurrences="11" value="lë" /> + <ngram occurrences="11" value="kët" /> + <ngram occurrences="11" value="kisht" /> + <ngram occurrences="11" value="hë" /> + <ngram occurrences="11" value="hu" /> + <ngram occurrences="11" value="gji" /> + <ngram occurrences="11" value="et_" /> + <ngram occurrences="11" value="e_p" /> + <ngram occurrences="11" value="e_me" /> + <ngram occurrences="11" value="d_" /> + <ngram occurrences="11" value="bë" /> + <ngram occurrences="11" value="ap" /> + <ngram occurrences="11" value="ai" /> + <ngram occurrences="11" value="_te" /> + <ngram occurrences="11" value="_për_" /> + <ngram occurrences="11" value="_pr" /> + <ngram occurrences="11" value="_po" /> + <ngram occurrences="11" value="_mi" /> + <ngram occurrences="11" value="_kët" /> + <ngram occurrences="10" value="vet" /> + <ngram occurrences="10" value="va" /> + <ngram occurrences="10" value="ul" /> + <ngram occurrences="10" value="uar_" /> + <ngram occurrences="10" value="uar" /> + <ngram occurrences="10" value="tër" /> + <ngram occurrences="10" value="të_m" /> + <ngram occurrences="10" value="tha" /> + <ngram occurrences="10" value="silv" /> + <ngram occurrences="10" value="sil" /> + <ngram occurrences="10" value="r_n" /> + <ngram occurrences="10" value="qe" /> + <ngram occurrences="10" value="po_" /> + <ngram occurrences="10" value="ohe" /> + <ngram occurrences="10" value="ndo" /> + <ngram occurrences="10" value="na" /> + <ngram occurrences="10" value="mir" /> + <ngram occurrences="10" value="men" /> + <ngram occurrences="10" value="mb" /> + <ngram occurrences="10" value="lv" /> + <ngram occurrences="10" value="le" /> + <ngram occurrences="10" value="jit" /> + <ngram occurrences="10" value="ir" /> + <ngram occurrences="10" value="imi" /> + <ngram occurrences="10" value="ilv" /> + <ngram occurrences="10" value="gjit" /> + <ngram occurrences="10" value="e_v" /> + <ngram occurrences="10" value="e_d" /> + <ngram occurrences="10" value="ar_" /> + <ngram occurrences="10" value="a_p" /> + <ngram occurrences="10" value="_vet" /> + <ngram occurrences="10" value="_th" /> + <ngram occurrences="10" value="_ta" /> + <ngram occurrences="10" value="_silv" /> + <ngram occurrences="10" value="_sil" /> + <ngram occurrences="10" value="_se" /> + <ngram occurrences="10" value="_r" /> + <ngram occurrences="10" value="_më_" /> + <ngram occurrences="10" value="_c" /> + <ngram occurrences="9" value="ëri" /> + <ngram occurrences="9" value="ë_v" /> + <ngram occurrences="9" value="ë_për" /> + <ngram occurrences="9" value="ë_pë" /> + <ngram occurrences="9" value="ë_pa" /> + <ngram occurrences="9" value="ë_l" /> + <ngram occurrences="9" value="und" /> + <ngram occurrences="9" value="uk_" /> + <ngram occurrences="9" value="të_n" /> + <ngram occurrences="9" value="të_k" /> + <ngram occurrences="9" value="së_" /> + <ngram occurrences="9" value="rs" /> + <ngram occurrences="9" value="ro" /> + <ngram occurrences="9" value="ra_" /> + <ngram occurrences="9" value="pi" /> + <ngram occurrences="9" value="ont" /> + <ngram occurrences="9" value="ohej_" /> + <ngram occurrences="9" value="ohej" /> + <ngram occurrences="9" value="nu" /> + <ngram occurrences="9" value="nga_" /> + <ngram occurrences="9" value="ka_" /> + <ngram occurrences="9" value="jith" /> + <ngram occurrences="9" value="je_" /> + <ngram occurrences="9" value="ith" /> + <ngram occurrences="9" value="i_s" /> + <ngram occurrences="9" value="gu" /> + <ngram occurrences="9" value="gjith" /> + <ngram occurrences="9" value="ga_" /> + <ngram occurrences="9" value="de" /> + <ngram occurrences="9" value="br" /> + <ngram occurrences="9" value="al" /> + <ngram occurrences="9" value="ak" /> + <ngram occurrences="9" value="a_s" /> + <ngram occurrences="9" value="a_n" /> + <ngram occurrences="9" value="a_m" /> + <ngram occurrences="9" value="_u_" /> + <ngram occurrences="9" value="_të_t" /> + <ngram occurrences="9" value="_të_m" /> + <ngram occurrences="9" value="_të_k" /> + <ngram occurrences="9" value="_tha" /> + <ngram occurrences="9" value="_se_" /> + <ngram occurrences="9" value="_nu" /> + <ngram occurrences="9" value="_nga_" /> + <ngram occurrences="9" value="_kur" /> + <ngram occurrences="9" value="_ka" /> + <ngram occurrences="9" value="_j" /> + <ngram occurrences="9" value="_e_s" /> + <ngram occurrences="9" value="_bë" /> + <ngram occurrences="8" value="ëm" /> + <ngram occurrences="8" value="ë_sh" /> + <ngram occurrences="8" value="ë_e_" /> + <ngram occurrences="8" value="ë_e" /> + <ngram occurrences="8" value="ë_d" /> + <ngram occurrences="8" value="va_" /> + <ngram occurrences="8" value="të_s" /> + <ngram occurrences="8" value="tha_" /> + <ngram occurrences="8" value="tet" /> + <ngram occurrences="8" value="te_m" /> + <ngram occurrences="8" value="tan" /> + <ngram occurrences="8" value="silva" /> + <ngram occurrences="8" value="rm" /> + <ngram occurrences="8" value="rit" /> + <ngram occurrences="8" value="rg" /> + <ngram occurrences="8" value="rej" /> + <ngram occurrences="8" value="oni" /> + <ngram occurrences="8" value="nuk_" /> + <ngram occurrences="8" value="nuk" /> + <ngram occurrences="8" value="nin_" /> + <ngram occurrences="8" value="nin" /> + <ngram occurrences="8" value="mend" /> + <ngram occurrences="8" value="lva_" /> + <ngram occurrences="8" value="lva" /> + <ngram occurrences="8" value="lo" /> + <ngram occurrences="8" value="ke" /> + <ngram occurrences="8" value="jt" /> + <ngram occurrences="8" value="j_n" /> + <ngram occurrences="8" value="ilva_" /> + <ngram occurrences="8" value="ilva" /> + <ngram occurrences="8" value="id" /> + <ngram occurrences="8" value="i_k" /> + <ngram occurrences="8" value="ha_" /> + <ngram occurrences="8" value="h_" /> + <ngram occurrences="8" value="fa" /> + <ngram occurrences="8" value="bi" /> + <ngram occurrences="8" value="a_e_" /> + <ngram occurrences="8" value="a_e" /> + <ngram occurrences="8" value="_ç" /> + <ngram occurrences="8" value="_z" /> + <ngram occurrences="8" value="_të_p" /> + <ngram occurrences="8" value="_tha_" /> + <ngram occurrences="8" value="_sa" /> + <ngram occurrences="8" value="_nuk_" /> + <ngram occurrences="8" value="_nuk" /> + <ngram occurrences="8" value="_ndo" /> + <ngram occurrences="8" value="_mir" /> + <ngram occurrences="7" value="ëtë_" /> + <ngram occurrences="7" value="ëtë" /> + <ngram occurrences="7" value="ër_t" /> +</ngrams> diff --git a/src/plugins/language/arabic.klp b/src/plugins/language/arabic.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="778" value="_" /> + <ngram occurrences="538" value="ç" /> + <ngram occurrences="423" value="á" /> + <ngram occurrences="274" value="í" /> + <ngram occurrences="266" value="æ" /> + <ngram occurrences="259" value="ã" /> + <ngram occurrences="228" value="çá" /> + <ngram occurrences="204" value="_ç" /> + <ngram occurrences="200" value="ä" /> + <ngram occurrences="174" value="_çá" /> + <ngram occurrences="167" value="ú" /> + <ngram occurrences="154" value="ñ" /> + <ngram occurrences="146" value="è" /> + <ngram occurrences="130" value="ê" /> + <ngram occurrences="124" value="å" /> + <ngram occurrences="117" value="ï" /> + <ngram occurrences="117" value="ì" /> + <ngram occurrences="117" value="_ã" /> + <ngram occurrences="112" value="ó" /> + <ngram occurrences="105" value="_æ" /> + <ngram occurrences="100" value="ä_" /> + <ngram occurrences="94" value="ý" /> + <ngram occurrences="81" value="ç_" /> + <ngram occurrences="80" value="õ" /> + <ngram occurrences="77" value="ß" /> + <ngram occurrences="72" value="é" /> + <ngram occurrences="63" value="é_" /> + <ngram occurrences="62" value="þ" /> + <ngram occurrences="60" value="å_" /> + <ngram occurrences="56" value="áç" /> + <ngram occurrences="52" value="í_" /> + <ngram occurrences="48" value="áã" /> + <ngram occurrences="47" value="çä" /> + <ngram occurrences="47" value="á_" /> + <ngram occurrences="47" value="_ý" /> + <ngram occurrences="47" value="_è" /> + <ngram occurrences="45" value="ú_" /> + <ngram occurrences="45" value="ö" /> + <ngram occurrences="44" value="ì_" /> + <ngram occurrences="43" value="æá" /> + <ngram occurrences="42" value="ï_" /> + <ngram occurrences="41" value="ó_" /> + <ngram occurrences="41" value="ãä" /> + <ngram occurrences="38" value="æì" /> + <ngram occurrences="37" value="íç" /> + <ngram occurrences="36" value="æï" /> + <ngram occurrences="36" value="_í" /> + <ngram occurrences="35" value="çáã" /> + <ngram occurrences="35" value="æç" /> + <ngram occurrences="35" value="_ú" /> + <ngram occurrences="35" value="_á" /> + <ngram occurrences="34" value="ø" /> + <ngram occurrences="34" value="ò" /> + <ngram occurrences="34" value="ñ_" /> + <ngram occurrences="34" value="ä_ç" /> + <ngram occurrences="34" value="_çáã" /> + <ngram occurrences="33" value="ìæ" /> + <ngram occurrences="33" value="_ãä" /> + <ngram occurrences="32" value="ð" /> + <ngram occurrences="32" value="ë" /> + <ngram occurrences="31" value="ô" /> + <ngram occurrences="30" value="æìæ" /> + <ngram occurrences="30" value="ãí" /> + <ngram occurrences="30" value="áì" /> + <ngram occurrences="29" value="ýí" /> + <ngram occurrences="29" value="áú" /> + <ngram occurrences="29" value="áç_" /> + <ngram occurrences="28" value="ìæï" /> + <ngram occurrences="27" value="çä_" /> + <ngram occurrences="27" value="æìæï" /> + <ngram occurrences="27" value="ãä_" /> + <ngram occurrences="27" value="áì_" /> + <ngram occurrences="27" value="áæ" /> + <ngram occurrences="26" value="çæ" /> + <ngram occurrences="26" value="çáú" /> + <ngram occurrences="26" value="ä_çá" /> + <ngram occurrences="26" value="ãñ" /> + <ngram occurrences="26" value="ã_" /> + <ngram occurrences="26" value="_ê" /> + <ngram occurrences="25" value="úá" /> + <ngram occurrences="25" value="ö_" /> + <ngram occurrences="25" value="õ_" /> + <ngram occurrences="25" value="çáæ" /> + <ngram occurrences="25" value="_æç" /> + <ngram occurrences="24" value="íä" /> + <ngram occurrences="24" value="é_ç" /> + <ngram occurrences="24" value="_ýí" /> + <ngram occurrences="24" value="_ãí" /> + <ngram occurrences="23" value="çê" /> + <ngram occurrences="23" value="áí" /> + <ngram occurrences="23" value="_çáú" /> + <ngram occurrences="22" value="úñ" /> + <ngram occurrences="22" value="_ãä_" /> + <ngram occurrences="22" value="_ß" /> + <ngram occurrences="21" value="èú" /> + <ngram occurrences="21" value="_çä" /> + <ngram occurrences="21" value="_çáæ" /> + <ngram occurrences="20" value="ýí_" /> + <ngram occurrences="20" value="ñç" /> + <ngram occurrences="20" value="è_" /> + <ngram occurrences="19" value="êè" /> + <ngram occurrences="19" value="ê_" /> + <ngram occurrences="19" value="é_çá" /> + <ngram occurrences="19" value="_ýí_" /> + <ngram occurrences="18" value="æï_" /> + <ngram occurrences="18" value="æä" /> + <ngram occurrences="18" value="æã" /> + <ngram occurrences="18" value="áæìæ" /> + <ngram occurrences="18" value="áæì" /> + <ngram occurrences="18" value="áå" /> + <ngram occurrences="18" value="ßç" /> + <ngram occurrences="17" value="úáì_" /> + <ngram occurrences="17" value="úáì" /> + <ngram occurrences="17" value="ñè" /> + <ngram occurrences="17" value="ðç" /> + <ngram occurrences="17" value="ìæï_" /> + <ngram occurrences="17" value="êõ" /> + <ngram occurrences="17" value="çæá" /> + <ngram occurrences="17" value="çáæìæ" /> + <ngram occurrences="17" value="çáæì" /> + <ngram occurrences="17" value="çá_" /> + <ngram occurrences="17" value="æìæï_" /> + <ngram occurrences="17" value="åç" /> + <ngram occurrences="17" value="ãíç" /> + <ngram occurrences="17" value="_ñ" /> + <ngram occurrences="17" value="_ãíç" /> + <ngram occurrences="16" value="ñê" /> + <ngram occurrences="16" value="íï" /> + <ngram occurrences="16" value="í_ç" /> + <ngram occurrences="16" value="èú_" /> + <ngram occurrences="16" value="èí" /> + <ngram occurrences="16" value="ãó" /> + <ngram occurrences="16" value="áæìæï" /> + <ngram occurrences="16" value="_çä_" /> + <ngram occurrences="16" value="_å" /> + <ngram occurrences="15" value="ú_ã" /> + <ngram occurrences="15" value="íñ" /> + <ngram occurrences="15" value="íçæá" /> + <ngram occurrences="15" value="íçæ" /> + <ngram occurrences="15" value="èç" /> + <ngram occurrences="15" value="çï" /> + <ngram occurrences="15" value="æçá" /> + <ngram occurrences="15" value="ä_ã" /> + <ngram occurrences="15" value="ãíçæá" /> + <ngram occurrences="15" value="ãíçæ" /> + <ngram occurrences="15" value="áê" /> + <ngram occurrences="15" value="_çáæì" /> + <ngram occurrences="15" value="_æçá" /> + <ngram occurrences="15" value="_æá" /> + <ngram occurrences="15" value="_ãíçæ" /> + <ngram occurrences="14" value="ò_" /> + <ngram occurrences="14" value="íó" /> + <ngram occurrences="14" value="í_çá" /> + <ngram occurrences="14" value="êå" /> + <ngram occurrences="14" value="ç_ã" /> + <ngram occurrences="14" value="åç_" /> + <ngram occurrences="14" value="å_ç" /> + <ngram occurrences="14" value="äí" /> + <ngram occurrences="14" value="ãú" /> + <ngram occurrences="14" value="ãñê" /> + <ngram occurrences="14" value="ãç" /> + <ngram occurrences="14" value="áå_" /> + <ngram occurrences="14" value="áä" /> + <ngram occurrences="14" value="_úá" /> + <ngram occurrences="14" value="_æã" /> + <ngram occurrences="13" value="ñêè" /> + <ngram occurrences="13" value="ïç" /> + <ngram occurrences="13" value="èé" /> + <ngram occurrences="13" value="æá_" /> + <ngram occurrences="13" value="äç" /> + <ngram occurrences="13" value="ãñêè" /> + <ngram occurrences="13" value="ãæ" /> + <ngram occurrences="13" value="ãä_çá" /> + <ngram occurrences="13" value="ãä_ç" /> + <ngram occurrences="13" value="áõ" /> + <ngram occurrences="13" value="áó" /> + <ngram occurrences="13" value="á_ç" /> + <ngram occurrences="13" value="_ãñ" /> + <ngram occurrences="12" value="þí" /> + <ngram occurrences="12" value="ýí_ç" /> + <ngram occurrences="12" value="úñè" /> + <ngram occurrences="12" value="úä" /> + <ngram occurrences="12" value="óã" /> + <ngram occurrences="12" value="ñêèé_" /> + <ngram occurrences="12" value="ñêèé" /> + <ngram occurrences="12" value="ïå" /> + <ngram occurrences="12" value="î" /> + <ngram occurrences="12" value="íþ" /> + <ngram occurrences="12" value="íê" /> + <ngram occurrences="12" value="íé" /> + <ngram occurrences="12" value="íä_" /> + <ngram occurrences="12" value="íá" /> + <ngram occurrences="12" value="êèé_" /> + <ngram occurrences="12" value="êèé" /> + <ngram occurrences="12" value="èé_" /> + <ngram occurrences="12" value="èá" /> + <ngram occurrences="12" value="çæá_" /> + <ngram occurrences="12" value="çáê" /> + <ngram occurrences="12" value="çáç" /> + <ngram occurrences="12" value="ç_í" /> + <ngram occurrences="12" value="æñ" /> + <ngram occurrences="12" value="å_çá" /> + <ngram occurrences="12" value="å_æ" /> + <ngram occurrences="12" value="ãñêèé" /> + <ngram occurrences="12" value="áá" /> + <ngram occurrences="12" value="ß_" /> + <ngram occurrences="12" value="_ýí_ç" /> + <ngram occurrences="12" value="_ãä_ç" /> + <ngram occurrences="11" value="þï" /> + <ngram occurrences="11" value="ýí_çá" /> + <ngram occurrences="11" value="úñèú_" /> + <ngram occurrences="11" value="úñèú" /> + <ngram occurrences="11" value="ú_æ" /> + <ngram occurrences="11" value="ó_çá" /> + <ngram occurrences="11" value="ó_ç" /> + <ngram occurrences="11" value="ñèú_" /> + <ngram occurrences="11" value="ñèú" /> + <ngram occurrences="11" value="ñ_çá" /> + <ngram occurrences="11" value="ñ_ç" /> + <ngram occurrences="11" value="ðçê" /> + <ngram occurrences="11" value="íé_" /> + <ngram occurrences="11" value="íçæá_" /> + <ngram occurrences="11" value="íã" /> + <ngram occurrences="11" value="ì_ç" /> + <ngram occurrences="11" value="çè" /> + <ngram occurrences="11" value="çáúñè" /> + <ngram occurrences="11" value="çáúñ" /> + <ngram occurrences="11" value="ç_ç" /> + <ngram occurrences="11" value="æä_" /> + <ngram occurrences="11" value="áúñèú" /> + <ngram occurrences="11" value="áúñè" /> + <ngram occurrences="11" value="áúñ" /> + <ngram occurrences="11" value="áç_í" /> + <ngram occurrences="11" value="áß" /> + <ngram occurrences="11" value="á_çá" /> + <ngram occurrences="11" value="á_ã" /> + <ngram occurrences="11" value="_úáì_" /> + <ngram occurrences="11" value="_úáì" /> + <ngram occurrences="11" value="_çáúñ" /> + <ngram occurrences="11" value="_áç" /> + <ngram occurrences="10" value="úí" /> + <ngram occurrences="10" value="óç" /> + <ngram occurrences="10" value="ñó" /> + <ngram occurrences="10" value="ñí" /> + <ngram occurrences="10" value="íí" /> + <ngram occurrences="10" value="í_æ" /> + <ngram occurrences="10" value="ìè" /> + <ngram occurrences="10" value="ì_çá" /> + <ngram occurrences="10" value="êå_" /> + <ngram occurrences="10" value="é_æ" /> + <ngram occurrences="10" value="é_ã" /> + <ngram occurrences="10" value="çú" /> + <ngram occurrences="10" value="çì" /> + <ngram occurrences="10" value="çã" /> + <ngram occurrences="10" value="çáãñ" /> + <ngram occurrences="10" value="çáá" /> + <ngram occurrences="10" value="æõ" /> + <ngram occurrences="10" value="æí" /> + <ngram occurrences="10" value="æáç" /> + <ngram occurrences="10" value="äæ" /> + <ngram occurrences="10" value="áó_" /> + <ngram occurrences="10" value="áãñ" /> + <ngram occurrences="10" value="áã_" /> + <ngram occurrences="10" value="ßæ" /> + <ngram occurrences="10" value="_þ" /> + <ngram occurrences="10" value="_ô" /> + <ngram occurrences="10" value="_çáç" /> + <ngram occurrences="10" value="_çáãñ" /> + <ngram occurrences="9" value="úç" /> + <ngram occurrences="9" value="ú_ãí" /> + <ngram occurrences="9" value="ö_çá" /> + <ngram occurrences="9" value="ö_ç" /> + <ngram occurrences="9" value="óí" /> + <ngram occurrences="9" value="íñ_" /> + <ngram occurrences="9" value="ìè_" /> + <ngram occurrences="9" value="çó" /> + <ngram occurrences="9" value="çí" /> + <ngram occurrences="9" value="çìè_" /> + <ngram occurrences="9" value="çìè" /> + <ngram occurrences="9" value="çäí" /> + <ngram occurrences="9" value="çáì" /> + <ngram occurrences="9" value="çáä" /> + <ngram occurrences="9" value="ç_è" /> + <ngram occurrences="9" value="ç_çá" /> + <ngram occurrences="9" value="æçìè_" /> + <ngram occurrences="9" value="æçìè" /> + <ngram occurrences="9" value="æçì" /> + <ngram occurrences="9" value="æáç_" /> + <ngram occurrences="9" value="äí_" /> + <ngram occurrences="9" value="ãö" /> + <ngram occurrences="9" value="ãä_ã" /> + <ngram occurrences="9" value="ßæä" /> + <ngram occurrences="9" value="_èá" /> + <ngram occurrences="9" value="_æáç" /> + <ngram occurrences="9" value="_ãä_ã" /> + <ngram occurrences="9" value="_áç_" /> + <ngram occurrences="8" value="û" /> + <ngram occurrences="8" value="ú_ç" /> + <ngram occurrences="8" value="öç" /> + <ngram occurrences="8" value="õæ" /> + <ngram occurrences="8" value="ó_è" /> + <ngram occurrences="8" value="ðçêå_" /> + <ngram occurrences="8" value="ðçêå" /> + <ngram occurrences="8" value="ïí" /> + <ngram occurrences="8" value="ïé" /> + <ngram occurrences="8" value="íçá_" /> + <ngram occurrences="8" value="íçá" /> + <ngram occurrences="8" value="íå" /> + <ngram occurrences="8" value="íß" /> + <ngram occurrences="8" value="í_çáã" /> + <ngram occurrences="8" value="ëá" /> + <ngram occurrences="8" value="êú" /> + <ngram occurrences="8" value="êí" /> + <ngram occurrences="8" value="é_ýí" /> + <ngram occurrences="8" value="é_ý" /> + <ngram occurrences="8" value="èçá" /> + <ngram occurrences="8" value="èä" /> + <ngram occurrences="8" value="èáçï" /> + <ngram occurrences="8" value="èáç" /> + <ngram occurrences="8" value="è_çá" /> + <ngram occurrences="8" value="è_ç" /> + <ngram occurrences="8" value="çêå_" /> + <ngram occurrences="8" value="çêå" /> + <ngram occurrences="8" value="çê_" /> + <ngram occurrences="8" value="çä_ç" /> + <ngram occurrences="8" value="çáãñê" /> + <ngram occurrences="8" value="çß" /> + <ngram occurrences="8" value="ç_æ" /> + <ngram occurrences="8" value="ç_á" /> + <ngram occurrences="8" value="æþ" /> + <ngram occurrences="8" value="æñ_" /> + <ngram occurrences="8" value="åä" /> + <ngram occurrences="8" value="äý" /> + <ngram occurrences="8" value="äú" /> + <ngram occurrences="8" value="äê" /> + <ngram occurrences="8" value="äå" /> + <ngram occurrences="8" value="ä_æ" /> + <ngram occurrences="8" value="ãõ" /> + <ngram occurrences="8" value="áíó" /> + <ngram occurrences="8" value="áçï" /> + <ngram occurrences="8" value="áãñêè" /> + <ngram occurrences="8" value="áãñê" /> + <ngram occurrences="8" value="ááå_" /> + <ngram occurrences="8" value="ááå" /> + <ngram occurrences="8" value="ßæä_" /> + <ngram occurrences="8" value="ßá" /> + <ngram occurrences="8" value="_ó" /> + <ngram occurrences="8" value="_ðçê" /> + <ngram occurrences="8" value="_ðç" /> + <ngram occurrences="8" value="_ð" /> + <ngram occurrences="8" value="_íß" /> + <ngram occurrences="8" value="_èçá" /> + <ngram occurrences="8" value="_èç" /> + <ngram occurrences="8" value="_èáçï" /> + <ngram occurrences="8" value="_èáç" /> + <ngram occurrences="8" value="_çáì" /> + <ngram occurrences="8" value="_çáê" /> + <ngram occurrences="8" value="_çáá" /> + <ngram occurrences="8" value="_æáç_" /> + <ngram occurrences="8" value="_ä" /> + <ngram occurrences="8" value="_ãú" /> + <ngram occurrences="7" value="þç" /> + <ngram occurrences="7" value="ýú" /> + <ngram occurrences="7" value="ýæ" /> + <ngram occurrences="7" value="ý_" /> + <ngram occurrences="7" value="úþ" /> + <ngram occurrences="7" value="úï" /> + <ngram occurrences="7" value="úíä" /> + <ngram occurrences="7" value="ú_ãíç" /> + <ngram occurrences="7" value="õå" /> + <ngram occurrences="7" value="ôí" /> + <ngram occurrences="7" value="óê" /> + <ngram occurrences="7" value="ñã" /> + <ngram occurrences="7" value="ïé_" /> + <ngram occurrences="7" value="ïå_" /> + <ngram occurrences="7" value="ï_æ" /> + <ngram occurrences="7" value="ï_ã" /> + <ngram occurrences="7" value="íì" /> + <ngram occurrences="7" value="íßæä_" /> + <ngram occurrences="7" value="íßæä" /> + <ngram occurrences="7" value="íßæ" /> + <ngram occurrences="7" value="ìç" /> + <ngram occurrences="7" value="ì_ã" /> + <ngram occurrences="7" value="êõ_" /> + <ngram occurrences="7" value="é_ýí_" /> + <ngram occurrences="7" value="èíä" /> + <ngram occurrences="7" value="çý" /> + <ngram occurrences="7" value="çô" /> + <ngram occurrences="7" value="çñ" /> + <ngram occurrences="7" value="çáñ" /> + <ngram occurrences="7" value="çáí" /> + <ngram occurrences="7" value="çáæçì" /> + <ngram occurrences="7" value="çáæç" /> + <ngram occurrences="7" value="çááå_" /> + <ngram occurrences="7" value="çááå" /> + <ngram occurrences="7" value="æè" /> + <ngram occurrences="7" value="åú" /> + <ngram occurrences="7" value="åð" /> + <ngram occurrences="7" value="å_ã" /> + <ngram occurrences="7" value="äú_" /> +</ngrams> diff --git a/src/plugins/language/arabic2.klp b/src/plugins/language/arabic2.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1554" value="_" /> + <ngram occurrences="897" value="ø" /> + <ngram occurrences="759" value="_ø" /> + <ngram occurrences="750" value="ù" /> + <ngram occurrences="723" value="ù_" /> + <ngram occurrences="614" value="_ù" /> + <ngram occurrences="603" value="_ù_" /> + <ngram occurrences="596" value="ø_" /> + <ngram occurrences="499" value="_ø_" /> + <ngram occurrences="446" value="ù_ø" /> + <ngram occurrences="378" value="_ù_ø" /> + <ngram occurrences="312" value="ø_ù_" /> + <ngram occurrences="312" value="ø_ù" /> + <ngram occurrences="291" value="ù_ø_" /> + <ngram occurrences="275" value="ø_ø" /> + <ngram occurrences="275" value="_ø_ù_" /> + <ngram occurrences="275" value="_ø_ù" /> + <ngram occurrences="269" value="ù_ù_" /> + <ngram occurrences="269" value="ù_ù" /> + <ngram occurrences="229" value="_ù_ø_" /> + <ngram occurrences="218" value="_ù_ù_" /> + <ngram occurrences="218" value="_ù_ù" /> + <ngram occurrences="217" value="_ø_ø" /> + <ngram occurrences="189" value="ø_ù_ø" /> + <ngram occurrences="180" value="ø_ø_" /> + <ngram occurrences="175" value="ù_ù_ø" /> + <ngram occurrences="164" value="ç" /> + <ngram occurrences="156" value="ù_ø_ù" /> + <ngram occurrences="132" value="_ø_ø_" /> + <ngram occurrences="131" value="ù_ø_ø" /> + <ngram occurrences="122" value="ø_ù_ù" /> + <ngram occurrences="99" value="ø_ø_ù" /> + <ngram occurrences="99" value="è" /> + <ngram occurrences="89" value="ä" /> + <ngram occurrences="88" value="ù_ù_ù" /> + <ngram occurrences="86" value="øª" /> + <ngram occurrences="86" value="ª" /> + <ngram occurrences="78" value="ø_ø_ø" /> + <ngram occurrences="77" value="_øª" /> + <ngram occurrences="73" value="ê" /> + <ngram occurrences="67" value="ø¹" /> + <ngram occurrences="67" value="¹" /> + <ngram occurrences="63" value="¨" /> + <ngram occurrences="63" value="ø¨" /> + <ngram occurrences="58" value="_ø¨" /> + <ngram occurrences="58" value="_ç" /> + <ngram occurrences="52" value="_ø¹" /> + <ngram occurrences="51" value="çä" /> + <ngram occurrences="50" value="æ" /> + <ngram occurrences="49" value="ù_øª" /> + <ngram occurrences="49" value="_ù_øª" /> + <ngram occurrences="48" value="å" /> + <ngram occurrences="45" value="_çä" /> + <ngram occurrences="42" value="ã" /> + <ngram occurrences="41" value="ñ" /> + <ngram occurrences="38" value="¨ø" /> + <ngram occurrences="38" value="ø¨ø" /> + <ngram occurrences="38" value="ï" /> + <ngram occurrences="38" value="_ø¨ø" /> + <ngram occurrences="37" value="ç_" /> + <ngram occurrences="35" value="øªø" /> + <ngram occurrences="35" value="ªø" /> + <ngram occurrences="34" value="ø¹ù_" /> + <ngram occurrences="34" value="ø¹ù" /> + <ngram occurrences="34" value="¹ù_" /> + <ngram occurrences="34" value="¹ù" /> + <ngram occurrences="33" value="î" /> + <ngram occurrences="31" value="ù_ø¹" /> + <ngram occurrences="31" value="ø³" /> + <ngram occurrences="31" value="³" /> + <ngram occurrences="31" value="_ù_ø¹" /> + <ngram occurrences="31" value="_ø³" /> + <ngram occurrences="30" value="_øªø" /> + <ngram occurrences="29" value="øªù_" /> + <ngram occurrences="29" value="øªù" /> + <ngram occurrences="29" value="øªø_" /> + <ngram occurrences="29" value="æ_" /> + <ngram occurrences="29" value="ªù_" /> + <ngram occurrences="29" value="ªù" /> + <ngram occurrences="29" value="ªø_" /> + <ngram occurrences="28" value="ø_ø¨" /> + <ngram occurrences="28" value="_ø¹ù_" /> + <ngram occurrences="28" value="_ø¹ù" /> + <ngram occurrences="26" value="ù_ø¨" /> + <ngram occurrences="26" value="ù_øªø" /> + <ngram occurrences="26" value="ø_øª" /> + <ngram occurrences="26" value="_øªø_" /> + <ngram occurrences="25" value="¨ø_" /> + <ngram occurrences="25" value="ø¨ø_" /> + <ngram occurrences="25" value="ì" /> + <ngram occurrences="25" value="_ø¨ø_" /> + <ngram occurrences="25" value="_øªù_" /> + <ngram occurrences="25" value="_øªù" /> + <ngram occurrences="25" value="_è" /> + <ngram occurrences="24" value="ø_ø¨ø" /> + <ngram occurrences="24" value="ð" /> + <ngram occurrences="24" value="_ù_ø¨" /> + <ngram occurrences="24" value="_ø_øª" /> + <ngram occurrences="23" value="¨ù_" /> + <ngram occurrences="23" value="¨ù" /> + <ngram occurrences="23" value="ø¨ù_" /> + <ngram occurrences="23" value="ø¨ù" /> + <ngram occurrences="23" value="_ø_ø¨" /> + <ngram occurrences="22" value="¸" /> + <ngram occurrences="22" value="ø¸" /> + <ngram occurrences="22" value="øª_" /> + <ngram occurrences="22" value="á" /> + <ngram occurrences="22" value="ª_" /> + <ngram occurrences="22" value="_øª_" /> + <ngram occurrences="20" value="ù_ø³" /> + <ngram occurrences="20" value="ø¹ù_ø" /> + <ngram occurrences="20" value="ø_ø¹" /> + <ngram occurrences="20" value="¹ù_ø" /> + <ngram occurrences="20" value="_å" /> + <ngram occurrences="19" value="ø¹ø_" /> + <ngram occurrences="19" value="ø¹ø" /> + <ngram occurrences="19" value="ø³ø" /> + <ngram occurrences="19" value="í" /> + <ngram occurrences="19" value="¹ø_" /> + <ngram occurrences="19" value="¹ø" /> + <ngram occurrences="19" value="³ø" /> + <ngram occurrences="19" value="_ù_ø³" /> + <ngram occurrences="19" value="_ø³ø" /> + <ngram occurrences="19" value="_ø_ø¹" /> + <ngram occurrences="18" value="é" /> + <ngram occurrences="18" value="¹ù_ø_" /> + <ngram occurrences="18" value="_ø¸" /> + <ngram occurrences="18" value="_ø¨ù_" /> + <ngram occurrences="18" value="_ø¨ù" /> + <ngram occurrences="17" value="ù_ø¹ù" /> + <ngram occurrences="17" value="øªù_ø" /> + <ngram occurrences="17" value="øªø_ø" /> + <ngram occurrences="17" value="ò" /> + <ngram occurrences="17" value="ªù_ø" /> + <ngram occurrences="17" value="ªø_ø" /> + <ngram occurrences="17" value="_ã" /> + <ngram occurrences="16" value="¨ø_ø" /> + <ngram occurrences="16" value="ù_øªù" /> + <ngram occurrences="16" value="ø¨ø_ø" /> + <ngram occurrences="15" value="øª_ø" /> + <ngram occurrences="15" value="ø_øª_" /> + <ngram occurrences="15" value="ï_" /> + <ngram occurrences="15" value="î_" /> + <ngram occurrences="15" value="ª_ø" /> + <ngram occurrences="15" value="_øª_ø" /> + <ngram occurrences="14" value="¨ø_ø_" /> + <ngram occurrences="14" value="ù_ø¸" /> + <ngram occurrences="14" value="ø¹ù_ù" /> + <ngram occurrences="14" value="ø¹_" /> + <ngram occurrences="14" value="ìè" /> + <ngram occurrences="14" value="ê_" /> + <ngram occurrences="14" value="èç" /> + <ngram occurrences="14" value="¹ù_ù_" /> + <ngram occurrences="14" value="¹ù_ù" /> + <ngram occurrences="14" value="¹_" /> + <ngram occurrences="13" value="øµ" /> + <ngram occurrences="13" value="ðç" /> + <ngram occurrences="13" value="é_" /> + <ngram occurrences="13" value="µ" /> + <ngram occurrences="13" value="ªù_ø_" /> + <ngram occurrences="13" value="ªø_ø_" /> + <ngram occurrences="13" value="_ø¹ø_" /> + <ngram occurrences="13" value="_ø¹ø" /> + <ngram occurrences="13" value="_ê" /> + <ngram occurrences="12" value="¸ø" /> + <ngram occurrences="12" value="¨ù_ù_" /> + <ngram occurrences="12" value="¨ù_ù" /> + <ngram occurrences="12" value="ù_ø¨ù" /> + <ngram occurrences="12" value="ù_ø¨ø" /> + <ngram occurrences="12" value="ø¸ø" /> + <ngram occurrences="12" value="ø¨ù_ù" /> + <ngram occurrences="12" value="øªù_ù" /> + <ngram occurrences="12" value="êç" /> + <ngram occurrences="12" value="èï" /> + <ngram occurrences="12" value="çè" /> + <ngram occurrences="12" value="äè" /> + <ngram occurrences="12" value="äç" /> + <ngram occurrences="12" value="ªù_ù_" /> + <ngram occurrences="12" value="ªù_ù" /> + <ngram occurrences="12" value="_ù_ø¸" /> + <ngram occurrences="11" value="¨ù_ø_" /> + <ngram occurrences="11" value="¨ù_ø" /> + <ngram occurrences="11" value="ø¨ù_ø" /> + <ngram occurrences="11" value="ø¹ø_ø" /> + <ngram occurrences="11" value="ò_" /> + <ngram occurrences="11" value="ìèï" /> + <ngram occurrences="11" value="èï_" /> + <ngram occurrences="11" value="èìèï" /> + <ngram occurrences="11" value="èìè" /> + <ngram occurrences="11" value="èì" /> + <ngram occurrences="11" value="è_" /> + <ngram occurrences="11" value="çê" /> + <ngram occurrences="11" value="çäè" /> + <ngram occurrences="11" value="ä_" /> + <ngram occurrences="11" value="â" /> + <ngram occurrences="11" value="¹ø_ø" /> + <ngram occurrences="11" value="_ø¸ø" /> + <ngram occurrences="11" value="_ø¹_" /> + <ngram occurrences="11" value="_çäè" /> + <ngram occurrences="10" value="ùä" /> + <ngram occurrences="10" value="ù_ø¸ø" /> + <ngram occurrences="10" value="ù_ø³ø" /> + <ngram occurrences="10" value="øªø_ù" /> + <ngram occurrences="10" value="øª_ø_" /> + <ngram occurrences="10" value="ø_ø¹ù" /> + <ngram occurrences="10" value="ø_ø³" /> + <ngram occurrences="10" value="ó" /> + <ngram occurrences="10" value="ìèï_" /> + <ngram occurrences="10" value="èìèï_" /> + <ngram occurrences="10" value="èä" /> + <ngram occurrences="10" value="çæ" /> + <ngram occurrences="10" value="æ_ç" /> + <ngram occurrences="10" value="ªø_ù_" /> + <ngram occurrences="10" value="ªø_ù" /> + <ngram occurrences="10" value="ª_ø_" /> + <ngram occurrences="10" value="_øµ" /> + <ngram occurrences="9" value="¸ù_" /> + <ngram occurrences="9" value="¸ù" /> + <ngram occurrences="9" value="¨ø_ù_" /> + <ngram occurrences="9" value="¨ø_ù" /> + <ngram occurrences="9" value="ù_ø¹ø" /> + <ngram occurrences="9" value="ø¸ù_" /> + <ngram occurrences="9" value="ø¸ù" /> + <ngram occurrences="9" value="ø¨ø_ù" /> + <ngram occurrences="9" value="ø³ù_" /> + <ngram occurrences="9" value="ø³ù" /> + <ngram occurrences="9" value="ø³øª" /> + <ngram occurrences="9" value="ø²" /> + <ngram occurrences="9" value="ø_ø³ø" /> + <ngram occurrences="9" value="ö" /> + <ngram occurrences="9" value="çç" /> + <ngram occurrences="9" value="¹ø_ø_" /> + <ngram occurrences="9" value="³ù_" /> + <ngram occurrences="9" value="³ù" /> + <ngram occurrences="9" value="³øª" /> + <ngram occurrences="9" value="²" /> + <ngram occurrences="9" value="ª_ø_ù" /> + <ngram occurrences="9" value="_ø³ù_" /> + <ngram occurrences="9" value="_ø³ù" /> + <ngram occurrences="9" value="_ø³øª" /> + <ngram occurrences="9" value="_ø²" /> + <ngram occurrences="9" value="_ø_ø³" /> + <ngram occurrences="8" value="¸ø_" /> + <ngram occurrences="8" value="¨ø¹" /> + <ngram occurrences="8" value="ù_ø³ù" /> + <ngram occurrences="8" value="ø¸ø_" /> + <ngram occurrences="8" value="ø¨ø¹" /> + <ngram occurrences="8" value="øº" /> + <ngram occurrences="8" value="ø¹ø_ù" /> + <ngram occurrences="8" value="ø_øªù" /> + <ngram occurrences="8" value="ñ_" /> + <ngram occurrences="8" value="êï" /> + <ngram occurrences="8" value="çç_" /> + <ngram occurrences="8" value="çäèìè" /> + <ngram occurrences="8" value="çäèì" /> + <ngram occurrences="8" value="ç_è" /> + <ngram occurrences="8" value="äèìèï" /> + <ngram occurrences="8" value="äèìè" /> + <ngram occurrences="8" value="äèì" /> + <ngram occurrences="8" value="äå" /> + <ngram occurrences="8" value="º" /> + <ngram occurrences="8" value="¹ø_ù_" /> + <ngram occurrences="8" value="¹ø_ù" /> + <ngram occurrences="8" value="_ø¨ø¹" /> + <ngram occurrences="8" value="_çäèì" /> + <ngram occurrences="8" value="_á" /> + <ngram occurrences="7" value="ù_øµ" /> + <ngram occurrences="7" value="ù_øª_" /> + <ngram occurrences="7" value="ø¹_ø_" /> + <ngram occurrences="7" value="ø¹_ø" /> + <ngram occurrences="7" value="øµø" /> + <ngram occurrences="7" value="ø³ø_" /> + <ngram occurrences="7" value="ðç_" /> + <ngram occurrences="7" value="ï_çä" /> + <ngram occurrences="7" value="ï_ç" /> + <ngram occurrences="7" value="íç" /> + <ngram occurrences="7" value="êæ" /> + <ngram occurrences="7" value="èæ" /> + <ngram occurrences="7" value="çäå" /> + <ngram occurrences="7" value="ç_å" /> + <ngram occurrences="7" value="æ_çä" /> + <ngram occurrences="7" value="åç" /> + <ngram occurrences="7" value="åæ_" /> + <ngram occurrences="7" value="åæ" /> + <ngram occurrences="7" value="ãê" /> + <ngram occurrences="7" value="ãæ" /> + <ngram occurrences="7" value="áê" /> + <ngram occurrences="7" value="¹_ø_" /> + <ngram occurrences="7" value="¹_ø" /> + <ngram occurrences="7" value="µø" /> + <ngram occurrences="7" value="³ø_" /> + <ngram occurrences="7" value="_ù_øµ" /> + <ngram occurrences="7" value="_ø¸ø_" /> + <ngram occurrences="7" value="_ø¹_ø" /> + <ngram occurrences="7" value="_ø³ø_" /> + <ngram occurrences="7" value="_èç" /> + <ngram occurrences="7" value="_çäå" /> + <ngram occurrences="6" value="ù_ø²" /> + <ngram occurrences="6" value="øºù_" /> + <ngram occurrences="6" value="øºù" /> + <ngram occurrences="6" value="ø¹_ù_" /> + <ngram occurrences="6" value="ø¹_ù" /> + <ngram occurrences="6" value="øµù_" /> + <ngram occurrences="6" value="øµù" /> + <ngram occurrences="6" value="øª_ù_" /> + <ngram occurrences="6" value="øª_ù" /> + <ngram occurrences="6" value="ø_ø¹_" /> + <ngram occurrences="6" value="ð_" /> + <ngram occurrences="6" value="ïç" /> + <ngram occurrences="6" value="ê_ç" /> + <ngram occurrences="6" value="é_ç" /> + <ngram occurrences="6" value="èæ_" /> + <ngram occurrences="6" value="çè_" /> + <ngram occurrences="6" value="çæ_" /> + <ngram occurrences="6" value="çå" /> + <ngram occurrences="6" value="çäù" /> + <ngram occurrences="6" value="ç_ç" /> + <ngram occurrences="6" value="äù" /> + <ngram occurrences="6" value="äð" /> + <ngram occurrences="6" value="äé_" /> + <ngram occurrences="6" value="äé" /> + <ngram occurrences="6" value="ºù_" /> + <ngram occurrences="6" value="ºù" /> + <ngram occurrences="6" value="¹_ù_ø" /> + <ngram occurrences="6" value="¹_ù_" /> + <ngram occurrences="6" value="¹_ù" /> + <ngram occurrences="6" value="µù_" /> + <ngram occurrences="6" value="µù" /> + <ngram occurrences="6" value="ª_ù_" /> + <ngram occurrences="6" value="ª_ù" /> + <ngram occurrences="6" value="_ø¸ù_" /> + <ngram occurrences="6" value="_ø¸ù" /> + <ngram occurrences="6" value="_øª_ù" /> + <ngram occurrences="6" value="_çæ" /> + <ngram occurrences="6" value="_çäù" /> + <ngram occurrences="6" value="_åæ_" /> + <ngram occurrences="6" value="_åæ" /> + <ngram occurrences="6" value="_ä" /> + <ngram occurrences="5" value="¸ù_ù_" /> + <ngram occurrences="5" value="¸ù_ù" /> + <ngram occurrences="5" value="¸ø_ø_" /> + <ngram occurrences="5" value="¸ø_ø" /> + <ngram occurrences="5" value="¨ø¹ø_" /> + <ngram occurrences="5" value="¨ø¹ø" /> + <ngram occurrences="5" value="ù_ø¹_" /> + <ngram occurrences="5" value="ø¸ù_ù" /> + <ngram occurrences="5" value="ø¸ø_ø" /> + <ngram occurrences="5" value="ø¨ø¹ø" /> + <ngram occurrences="5" value="øºù_ø" /> + <ngram occurrences="5" value="øµù_ø" /> + <ngram occurrences="5" value="ø³ù_ù" /> + <ngram occurrences="5" value="ø³øªø" /> + <ngram occurrences="5" value="ø³ø_ø" /> + <ngram occurrences="5" value="ñé" /> + <ngram occurrences="5" value="ñã" /> + <ngram occurrences="5" value="ðçê" /> + <ngram occurrences="5" value="î_çä" /> + <ngram occurrences="5" value="î_ç" /> + <ngram occurrences="5" value="ë" /> + <ngram occurrences="5" value="êç_" /> + <ngram occurrences="5" value="èñ" /> + <ngram occurrences="5" value="èï_çä" /> + <ngram occurrences="5" value="èï_ç" /> + <ngram occurrences="5" value="çðç_" /> + <ngram occurrences="5" value="çðç" /> + <ngram occurrences="5" value="çð" /> + <ngram occurrences="5" value="çä_" /> + <ngram occurrences="5" value="åï" /> + <ngram occurrences="5" value="äã" /> + <ngram occurrences="5" value="ºù_ø_" /> + <ngram occurrences="5" value="ºù_ø" /> + <ngram occurrences="5" value="¹_ø_ù" /> + <ngram occurrences="5" value="µù_ø_" /> + <ngram occurrences="5" value="µù_ø" /> + <ngram occurrences="5" value="³ù_ù_" /> + <ngram occurrences="5" value="³ù_ù" /> + <ngram occurrences="5" value="³øªø" /> + <ngram occurrences="5" value="³ø_ø" /> + <ngram occurrences="5" value="_ù_ø²" /> + <ngram occurrences="5" value="_øº" /> + <ngram occurrences="5" value="_øµù_" /> + <ngram occurrences="5" value="_øµù" /> + <ngram occurrences="5" value="_øµø" /> + <ngram occurrences="5" value="_çæ_" /> + <ngram occurrences="5" value="_â" /> + <ngram occurrences="5" value="_áê" /> + <ngram occurrences="4" value="¸ù_ø_" /> + <ngram occurrences="4" value="¸ù_ø" /> + <ngram occurrences="4" value="¸ø¨ù_" /> + <ngram occurrences="4" value="¸ø¨ù" /> + <ngram occurrences="4" value="¸ø¨" /> + <ngram occurrences="4" value="ù_øµø" /> + <ngram occurrences="4" value="ø¸ù_ø" /> + <ngram occurrences="4" value="ø¸ø¨ù" /> + <ngram occurrences="4" value="ø¸ø¨" /> + <ngram occurrences="4" value="øµø_" /> + <ngram occurrences="4" value="ø³ù_ø" /> + <ngram occurrences="4" value="ø³øªù" /> + <ngram occurrences="4" value="ø²ø" /> + <ngram occurrences="4" value="ø_ø¨ù" /> +</ngrams> diff --git a/src/plugins/language/armenian.klp b/src/plugins/language/armenian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="809" value="_" /> + <ngram occurrences="355" value="³" /> + <ngram occurrences="254" value="ï" /> + <ngram occurrences="242" value="ñ" /> + <ngram occurrences="215" value="ý" /> + <ngram occurrences="196" value="á" /> + <ngram occurrences="140" value="_ï" /> + <ngram occurrences="137" value="ó" /> + <ngram occurrences="127" value="õ" /> + <ngram occurrences="125" value="ù" /> + <ngram occurrences="122" value="ï_" /> + <ngram occurrences="122" value="_ñ" /> + <ngram occurrences="107" value="ç" /> + <ngram occurrences="101" value="ý_" /> + <ngram occurrences="96" value="áõ" /> + <ngram occurrences="96" value="_ï_" /> + <ngram occurrences="95" value="ó_" /> + <ngram occurrences="94" value="é" /> + <ngram occurrences="92" value="ë" /> + <ngram occurrences="86" value="ñ_" /> + <ngram occurrences="85" value="_ó" /> + <ngram occurrences="80" value="³ý" /> + <ngram occurrences="76" value="û" /> + <ngram occurrences="75" value="í" /> + <ngram occurrences="70" value="_ó_" /> + <ngram occurrences="68" value="ã" /> + <ngram occurrences="67" value="ï³" /> + <ngram occurrences="55" value="³ï" /> + <ngram occurrences="54" value="ù_" /> + <ngram occurrences="52" value="_é" /> + <ngram occurrences="51" value="_³" /> + <ngram occurrences="50" value="ñ³" /> + <ngram occurrences="50" value="é_" /> + <ngram occurrences="48" value="í_" /> + <ngram occurrences="47" value="_ñ_" /> + <ngram occurrences="45" value="ç_" /> + <ngram occurrences="44" value="³ñ" /> + <ngram occurrences="43" value="å" /> + <ngram occurrences="43" value="_á" /> + <ngram occurrences="37" value="á_" /> + <ngram occurrences="37" value="_é_" /> + <ngram occurrences="35" value="¹" /> + <ngram occurrences="35" value="_ý" /> + <ngram occurrences="35" value="_ã" /> + <ngram occurrences="34" value="õ_" /> + <ngram occurrences="34" value="³ý_" /> + <ngram occurrences="34" value="_ù" /> + <ngram occurrences="34" value="_í" /> + <ngram occurrences="34" value="_ë" /> + <ngram occurrences="33" value="ù³" /> + <ngram occurrences="32" value="ý_ñ" /> + <ngram occurrences="32" value="ë_" /> + <ngram occurrences="31" value="áñ" /> + <ngram occurrences="31" value="³û" /> + <ngram occurrences="30" value="_ç" /> + <ngram occurrences="29" value="ý³" /> + <ngram occurrences="28" value="ã_" /> + <ngram occurrences="28" value="_ñ³" /> + <ngram occurrences="27" value="ñá" /> + <ngram occurrences="27" value="çý" /> + <ngram occurrences="26" value="ï_ó" /> + <ngram occurrences="26" value="³ï³" /> + <ngram occurrences="26" value="_í_" /> + <ngram occurrences="25" value="õù" /> + <ngram occurrences="25" value="ñ_ï" /> + <ngram occurrences="25" value="áõù" /> + <ngram occurrences="25" value="_õ" /> + <ngram occurrences="24" value="_ï_ó" /> + <ngram occurrences="23" value="û³" /> + <ngram occurrences="23" value="ï_ï" /> + <ngram occurrences="23" value="_ñ_ï" /> + <ngram occurrences="22" value="ï_ó_" /> + <ngram occurrences="22" value="éá" /> + <ngram occurrences="22" value="³ù" /> + <ngram occurrences="22" value="³_" /> + <ngram occurrences="21" value="³é" /> + <ngram occurrences="21" value="_ï³" /> + <ngram occurrences="21" value="_ï_ï" /> + <ngram occurrences="20" value="ñ_ï_" /> + <ngram occurrences="20" value="ïá" /> + <ngram occurrences="20" value="ï³ý" /> + <ngram occurrences="20" value="ï_ï_" /> + <ngram occurrences="20" value="³ë" /> + <ngram occurrences="20" value="_õ_" /> + <ngram occurrences="20" value="_ï_ó_" /> + <ngram occurrences="20" value="_ã_" /> + <ngram occurrences="19" value="õù_" /> + <ngram occurrences="19" value="ó_ó" /> + <ngram occurrences="19" value="áõù_" /> + <ngram occurrences="19" value="ß" /> + <ngram occurrences="19" value="_ó_ó" /> + <ngram occurrences="19" value="_ñ_ï_" /> + <ngram occurrences="19" value="_ï_ï_" /> + <ngram occurrences="18" value="ýá" /> + <ngram occurrences="18" value="ñï" /> + <ngram occurrences="18" value="çý_" /> + <ngram occurrences="18" value="µ" /> + <ngram occurrences="18" value="_áñ" /> + <ngram occurrences="17" value="ýù" /> + <ngram occurrences="17" value="õãû" /> + <ngram occurrences="17" value="õã" /> + <ngram occurrences="17" value="ó_ó_" /> + <ngram occurrences="17" value="ñç" /> + <ngram occurrences="17" value="ë³" /> + <ngram occurrences="17" value="ãû" /> + <ngram occurrences="17" value="áõãû" /> + <ngram occurrences="17" value="áõã" /> + <ngram occurrences="17" value="_ó_ó_" /> + <ngram occurrences="17" value="_ë_" /> + <ngram occurrences="16" value="½" /> + <ngram occurrences="16" value="õý" /> + <ngram occurrences="16" value="ó_ï" /> + <ngram occurrences="16" value="ï_ñ" /> + <ngram occurrences="16" value="áõý" /> + <ngram occurrences="16" value="³ï³ý" /> + <ngram occurrences="16" value="_å" /> + <ngram occurrences="15" value="ë_ï" /> + <ngram occurrences="15" value="éáõ" /> + <ngram occurrences="15" value="å³" /> + <ngram occurrences="15" value="å_" /> + <ngram occurrences="15" value="áñ_" /> + <ngram occurrences="15" value="_ý_" /> + <ngram occurrences="15" value="_ñç" /> + <ngram occurrences="15" value="_ç_" /> + <ngram occurrences="14" value="ï³ý_" /> + <ngram occurrences="14" value="ëï" /> + <ngram occurrences="14" value="_ù_" /> + <ngram occurrences="13" value="û³ý" /> + <ngram occurrences="13" value="ù³ý" /> + <ngram occurrences="13" value="³ï³ý_" /> + <ngram occurrences="13" value="_ó_ï" /> + <ngram occurrences="13" value="_ñï" /> + <ngram occurrences="13" value="_³û" /> + <ngram occurrences="12" value="ý_ñç" /> + <ngram occurrences="12" value="ùç" /> + <ngram occurrences="12" value="ó_ï_" /> + <ngram occurrences="12" value="ñáõ" /> + <ngram occurrences="12" value="ñ³ï" /> + <ngram occurrences="12" value="ëá" /> + <ngram occurrences="12" value="ë_ï_" /> + <ngram occurrences="12" value="é_ï" /> + <ngram occurrences="12" value="áõ_" /> + <ngram occurrences="12" value="_áñ_" /> + <ngram occurrences="11" value="ïáõ" /> + <ngram occurrences="11" value="í³" /> + <ngram occurrences="11" value="ç_ñ" /> + <ngram occurrences="11" value="³ó" /> + <ngram occurrences="11" value="³ï_" /> + <ngram occurrences="11" value="³å" /> + <ngram occurrences="11" value="_ó_ï_" /> + <ngram occurrences="11" value="_ï_ñ" /> + <ngram occurrences="11" value="_¹" /> + <ngram occurrences="10" value="ýó" /> + <ngram occurrences="10" value="ýáõ" /> + <ngram occurrences="10" value="ûá" /> + <ngram occurrences="10" value="õãû³" /> + <ngram occurrences="10" value="óý" /> + <ngram occurrences="10" value="ó³" /> + <ngram occurrences="10" value="ñó" /> + <ngram occurrences="10" value="ñá_" /> + <ngram occurrences="10" value="ñ³ý" /> + <ngram occurrences="10" value="ï_ó_ó" /> + <ngram occurrences="10" value="ï_ë" /> + <ngram occurrences="10" value="ãû³" /> + <ngram occurrences="10" value="ã_í" /> + <ngram occurrences="10" value="áõãû³" /> + <ngram occurrences="10" value="áí" /> + <ngram occurrences="10" value="¹³" /> + <ngram occurrences="10" value="³ñ_" /> + <ngram occurrences="10" value="³í" /> + <ngram occurrences="10" value="³éá" /> + <ngram occurrences="10" value="_ë_ï" /> + <ngram occurrences="10" value="_é_ï" /> + <ngram occurrences="9" value="ý_ñç_" /> + <ngram occurrences="9" value="ý_ï" /> + <ngram occurrences="9" value="ý_é" /> + <ngram occurrences="9" value="ûáõ" /> + <ngram occurrences="9" value="û³ý_" /> + <ngram occurrences="9" value="ù_ñ" /> + <ngram occurrences="9" value="õãû³ý" /> + <ngram occurrences="9" value="ñç_" /> + <ngram occurrences="9" value="ñ³ù" /> + <ngram occurrences="9" value="ð" /> + <ngram occurrences="9" value="ï³é" /> + <ngram occurrences="9" value="ï_ñ_" /> + <ngram occurrences="9" value="ï_é" /> + <ngram occurrences="9" value="í_ï" /> + <ngram occurrences="9" value="é_ï_" /> + <ngram occurrences="9" value="çó_" /> + <ngram occurrences="9" value="çó" /> + <ngram occurrences="9" value="ãû³ý" /> + <ngram occurrences="9" value="áí_" /> + <ngram occurrences="9" value="¹ñ" /> + <ngram occurrences="9" value="³½" /> + <ngram occurrences="9" value="³éáõ" /> + <ngram occurrences="9" value="_ù³" /> + <ngram occurrences="9" value="_ñç_" /> + <ngram occurrences="9" value="_ñá" /> + <ngram occurrences="9" value="_ïá" /> + <ngram occurrences="9" value="_ë_ï_" /> + <ngram occurrences="9" value="_é_ï_" /> + <ngram occurrences="8" value="ýý" /> + <ngram occurrences="8" value="ýù_" /> + <ngram occurrences="8" value="ýç" /> + <ngram occurrences="8" value="ýáõù" /> + <ngram occurrences="8" value="ý¹" /> + <ngram occurrences="8" value="ý³ï" /> + <ngram occurrences="8" value="ý_ù" /> + <ngram occurrences="8" value="ûáõý" /> + <ngram occurrences="8" value="ù_³" /> + <ngram occurrences="8" value="õû" /> + <ngram occurrences="8" value="ó_ñ" /> + <ngram occurrences="8" value="ó_é" /> + <ngram occurrences="8" value="ñ³ñ" /> + <ngram occurrences="8" value="ïç" /> + <ngram occurrences="8" value="ï³_" /> + <ngram occurrences="8" value="í_ó" /> + <ngram occurrences="8" value="éáõ_" /> + <ngram occurrences="8" value="ã_í_" /> + <ngram occurrences="8" value="áõû" /> + <ngram occurrences="8" value="µ_" /> + <ngram occurrences="8" value="³ýù" /> + <ngram occurrences="8" value="³ù³" /> + <ngram occurrences="8" value="³ñó" /> + <ngram occurrences="8" value="_ý³" /> + <ngram occurrences="8" value="_ñ³ù" /> + <ngram occurrences="8" value="_ï_ñ_" /> + <ngram occurrences="8" value="_ï_ë" /> + <ngram occurrences="8" value="_éá" /> + <ngram occurrences="8" value="_çý" /> + <ngram occurrences="8" value="_ã_í" /> + <ngram occurrences="8" value="_á_" /> + <ngram occurrences="8" value="_³ñ" /> + <ngram occurrences="7" value="ýáõù_" /> + <ngram occurrences="7" value="ùý" /> + <ngram occurrences="7" value="õãûáõ" /> + <ngram occurrences="7" value="õãûá" /> + <ngram occurrences="7" value="õá" /> + <ngram occurrences="7" value="õ_ñ" /> + <ngram occurrences="7" value="õ_³" /> + <ngram occurrences="7" value="ñ¹" /> + <ngram occurrences="7" value="ñ³ï³" /> + <ngram occurrences="7" value="ñ_ý" /> + <ngram occurrences="7" value="ñ_ñ" /> + <ngram occurrences="7" value="ïñ" /> + <ngram occurrences="7" value="ï³éáõ" /> + <ngram occurrences="7" value="ï³éá" /> + <ngram occurrences="7" value="ï_ï_ó" /> + <ngram occurrences="7" value="ï_ë_" /> + <ngram occurrences="7" value="ï_é_" /> + <ngram occurrences="7" value="íá" /> + <ngram occurrences="7" value="í_ó_" /> + <ngram occurrences="7" value="í_ñ" /> + <ngram occurrences="7" value="í_ï_" /> + <ngram occurrences="7" value="ê" /> + <ngram occurrences="7" value="éç" /> + <ngram occurrences="7" value="é³" /> + <ngram occurrences="7" value="çñ" /> + <ngram occurrences="7" value="ç_ñ³" /> + <ngram occurrences="7" value="ç_ï" /> + <ngram occurrences="7" value="ãûáõý" /> + <ngram occurrences="7" value="ãûáõ" /> + <ngram occurrences="7" value="ãûá" /> + <ngram occurrences="7" value="ãû³ý_" /> + <ngram occurrences="7" value="ãï³" /> + <ngram occurrences="7" value="ãï" /> + <ngram occurrences="7" value="áõãûá" /> + <ngram occurrences="7" value="á_³" /> + <ngram occurrences="7" value="³ýá" /> + <ngram occurrences="7" value="³ù_" /> + <ngram occurrences="7" value="³ñ³" /> + <ngram occurrences="7" value="³ïá" /> + <ngram occurrences="7" value="³ëï" /> + <ngram occurrences="7" value="³ß" /> + <ngram occurrences="7" value="²" /> + <ngram occurrences="7" value="_ý_ñ" /> + <ngram occurrences="7" value="_õ_³" /> + <ngram occurrences="7" value="_ó_é" /> + <ngram occurrences="7" value="_ï_ë_" /> + <ngram occurrences="7" value="_å_" /> + <ngram occurrences="7" value="_ãï³" /> + <ngram occurrences="7" value="_ãï" /> + <ngram occurrences="7" value="_áõ" /> + <ngram occurrences="7" value="_µ" /> + <ngram occurrences="6" value="¨_" /> + <ngram occurrences="6" value="¨" /> + <ngram occurrences="6" value="ýý_ñ" /> + <ngram occurrences="6" value="ýý_" /> + <ngram occurrences="6" value="ýá_" /> + <ngram occurrences="6" value="ý_ý" /> + <ngram occurrences="6" value="ý_³" /> + <ngram occurrences="6" value="ûý" /> + <ngram occurrences="6" value="ûë" /> + <ngram occurrences="6" value="ùç_" /> + <ngram occurrences="6" value="ù³ý_" /> + <ngram occurrences="6" value="ù_ý" /> + <ngram occurrences="6" value="óá" /> + <ngram occurrences="6" value="ó_ñ_" /> + <ngram occurrences="6" value="ñ³ù³" /> + <ngram occurrences="6" value="ñ_ó_" /> + <ngram occurrences="6" value="ñ_ó" /> + <ngram occurrences="6" value="ñ_é" /> + <ngram occurrences="6" value="ï³ñ" /> + <ngram occurrences="6" value="ï_í_" /> + <ngram occurrences="6" value="ï_í" /> + <ngram occurrences="6" value="ï_ç" /> + <ngram occurrences="6" value="ï_ã_" /> + <ngram occurrences="6" value="ï_ã" /> + <ngram occurrences="6" value="î" /> + <ngram occurrences="6" value="ë³ï" /> + <ngram occurrences="6" value="é_ó" /> + <ngram occurrences="6" value="é_ñ" /> + <ngram occurrences="6" value="å_ï" /> + <ngram occurrences="6" value="á_á" /> + <ngram occurrences="6" value="à" /> + <ngram occurrences="6" value="¹_" /> + <ngram occurrences="6" value="³ýç" /> + <ngram occurrences="6" value="³ý³" /> + <ngram occurrences="6" value="³ûë" /> + <ngram occurrences="6" value="³û³" /> + <ngram occurrences="6" value="³å³" /> + <ngram occurrences="6" value="_¨_" /> + <ngram occurrences="6" value="_¨" /> + <ngram occurrences="6" value="_ñ³ù³" /> + <ngram occurrences="6" value="_ñ_ó_" /> + <ngram occurrences="6" value="_ñ_ó" /> + <ngram occurrences="6" value="_ï_ç" /> + <ngram occurrences="6" value="_í_ï" /> + <ngram occurrences="6" value="_ê" /> + <ngram occurrences="6" value="_éáõ" /> + <ngram occurrences="6" value="_ã_í_" /> + <ngram occurrences="6" value="_³ý" /> + <ngram occurrences="6" value="_³ûë" /> + <ngram occurrences="5" value="½³" /> + <ngram occurrences="5" value="ýùç" /> + <ngram occurrences="5" value="ýó_" /> + <ngram occurrences="5" value="ýç_" /> + <ngram occurrences="5" value="ýã" /> + <ngram occurrences="5" value="ý³ï³ý" /> + <ngram occurrences="5" value="ý³ï³" /> + <ngram occurrences="5" value="ý_ñ_" /> + <ngram occurrences="5" value="ý_é_" /> + <ngram occurrences="5" value="ý_á" /> + <ngram occurrences="5" value="ûý_" /> + <ngram occurrences="5" value="ûó" /> + <ngram occurrences="5" value="ûñ" /> + <ngram occurrences="5" value="ùá" /> + <ngram occurrences="5" value="ù³ñ" /> + <ngram occurrences="5" value="ù_õ" /> + <ngram occurrences="5" value="ù_ñ_" /> + <ngram occurrences="5" value="õ_ï" /> + <ngram occurrences="5" value="õ_á" /> + <ngram occurrences="5" value="óý_" /> + <ngram occurrences="5" value="óç" /> + <ngram occurrences="5" value="óáõ" /> + <ngram occurrences="5" value="ó_ó_ï" /> + <ngram occurrences="5" value="ó_ñ_ï" /> + <ngram occurrences="5" value="ó_é_" /> + <ngram occurrences="5" value="ó_ç" /> + <ngram occurrences="5" value="ó_á" /> + <ngram occurrences="5" value="ñý" /> + <ngram occurrences="5" value="ñïñ" /> + <ngram occurrences="5" value="ñáõù" /> + <ngram occurrences="5" value="ñ³ñó" /> + <ngram occurrences="5" value="ïù" /> + <ngram occurrences="5" value="ïáõãû" /> + <ngram occurrences="5" value="ïáõã" /> + <ngram occurrences="5" value="ï³û" /> + <ngram occurrences="5" value="ï³ù" /> + <ngram occurrences="5" value="ï_õ_" /> + <ngram occurrences="5" value="ï_õ" /> + <ngram occurrences="5" value="ï_ï_ï" /> + <ngram occurrences="5" value="ï_ç_" /> + <ngram occurrences="5" value="íáõ" /> + <ngram occurrences="5" value="ëï_" /> + <ngram occurrences="5" value="ëáõ" /> + <ngram occurrences="5" value="ë_ã" /> + <ngram occurrences="5" value="é_ù" /> + <ngram occurrences="5" value="é_ó_" /> + <ngram occurrences="5" value="çñ_" /> + <ngram occurrences="5" value="ãï³_" /> + <ngram occurrences="5" value="áý" /> + <ngram occurrences="5" value="áë" /> + <ngram occurrences="5" value="ßë³" /> + <ngram occurrences="5" value="ßë" /> + <ngram occurrences="5" value="¹ñ³" /> + <ngram occurrences="5" value="¹á" /> + <ngram occurrences="5" value="¹³ï" /> + <ngram occurrences="5" value="³ýó" /> + <ngram occurrences="5" value="³ýá_" /> + <ngram occurrences="5" value="³ý_ù" /> + <ngram occurrences="5" value="³ý_³" /> + <ngram occurrences="5" value="³ñá" /> + <ngram occurrences="5" value="³ïáõ" /> + <ngram occurrences="5" value="³ëá" /> + <ngram occurrences="5" value="³é³" /> + <ngram occurrences="5" value="³¹" /> + <ngram occurrences="5" value="_ýù" /> + <ngram occurrences="5" value="_û" /> + <ngram occurrences="5" value="_ù_ñ_" /> +</ngrams> diff --git a/src/plugins/language/basque.klp b/src/plugins/language/basque.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="565" value="_" /> + <ngram occurrences="563" value="a" /> + <ngram occurrences="434" value="e" /> + <ngram occurrences="346" value="i" /> + <ngram occurrences="284" value="t" /> + <ngram occurrences="262" value="n" /> + <ngram occurrences="253" value="r" /> + <ngram occurrences="204" value="k" /> + <ngram occurrences="197" value="o" /> + <ngram occurrences="177" value="z" /> + <ngram occurrences="163" value="u" /> + <ngram occurrences="139" value="d" /> + <ngram occurrences="124" value="a_" /> + <ngram occurrences="120" value="n_" /> + <ngram occurrences="113" value="s" /> + <ngram occurrences="110" value="b" /> + <ngram occurrences="103" value="l" /> + <ngram occurrences="96" value="_e" /> + <ngram occurrences="91" value="g" /> + <ngram occurrences="87" value="en" /> + <ngram occurrences="73" value="er" /> + <ngram occurrences="70" value="_b" /> + <ngram occurrences="68" value="ta" /> + <ngram occurrences="67" value="o_" /> + <ngram occurrences="67" value="ko" /> + <ngram occurrences="66" value="ra" /> + <ngram occurrences="66" value="at" /> + <ngram occurrences="66" value="_d" /> + <ngram occurrences="62" value="h" /> + <ngram occurrences="59" value="te" /> + <ngram occurrences="57" value="en_" /> + <ngram occurrences="57" value="ar" /> + <ngram occurrences="56" value="an" /> + <ngram occurrences="54" value="_a" /> + <ngram occurrences="53" value="tz" /> + <ngram occurrences="53" value="m" /> + <ngram occurrences="52" value="ik" /> + <ngram occurrences="49" value="p" /> + <ngram occurrences="47" value="k_" /> + <ngram occurrences="46" value="ri" /> + <ngram occurrences="46" value="an_" /> + <ngram occurrences="46" value="al" /> + <ngram occurrences="45" value="ze" /> + <ngram occurrences="44" value="in" /> + <ngram occurrences="43" value="e_" /> + <ngram occurrences="41" value="ko_" /> + <ngram occurrences="41" value="it" /> + <ngram occurrences="41" value="ba" /> + <ngram occurrences="40" value="ka" /> + <ngram occurrences="40" value="i_" /> + <ngram occurrences="39" value="de" /> + <ngram occurrences="38" value="za" /> + <ngram occurrences="38" value="ez" /> + <ngram occurrences="38" value="ak" /> + <ngram occurrences="38" value="ai" /> + <ngram occurrences="37" value="re" /> + <ngram occurrences="35" value="z_" /> + <ngram occurrences="35" value="tu" /> + <ngram occurrences="35" value="da" /> + <ngram occurrences="34" value="rr" /> + <ngram occurrences="34" value="di" /> + <ngram occurrences="33" value="et" /> + <ngram occurrences="32" value="be" /> + <ngram occurrences="31" value="tze" /> + <ngram occurrences="31" value="ti" /> + <ngram occurrences="31" value="na" /> + <ngram occurrences="31" value="eta" /> + <ngram occurrences="31" value="_ba" /> + <ngram occurrences="30" value="iz" /> + <ngram occurrences="30" value="_h" /> + <ngram occurrences="29" value="un" /> + <ngram occurrences="29" value="ia" /> + <ngram occurrences="28" value="nt" /> + <ngram occurrences="28" value="es" /> + <ngram occurrences="28" value="_i" /> + <ngram occurrences="27" value="_k" /> + <ngram occurrences="27" value="_g" /> + <ngram occurrences="26" value="la" /> + <ngram occurrences="26" value="_be" /> + <ngram occurrences="24" value="rt" /> + <ngram occurrences="24" value="or" /> + <ngram occurrences="24" value="ha" /> + <ngram occurrences="24" value="go" /> + <ngram occurrences="24" value="az" /> + <ngram occurrences="23" value="zk" /> + <ngram occurrences="23" value="zen" /> + <ngram occurrences="23" value="ta_" /> + <ngram occurrences="23" value="sk" /> + <ngram occurrences="23" value="era" /> + <ngram occurrences="23" value="_n" /> + <ngram occurrences="22" value="ur" /> + <ngram occurrences="22" value="u_" /> + <ngram occurrences="22" value="st" /> + <ngram occurrences="22" value="n_e" /> + <ngram occurrences="22" value="bi" /> + <ngram occurrences="22" value="_de" /> + <ngram occurrences="21" value="tik" /> + <ngram occurrences="21" value="t_" /> + <ngram occurrences="21" value="rri" /> + <ngram occurrences="21" value="n_d" /> + <ngram occurrences="21" value="ma" /> + <ngram occurrences="21" value="ke" /> + <ngram occurrences="21" value="as" /> + <ngram occurrences="21" value="a_e" /> + <ngram occurrences="20" value="oa" /> + <ngram occurrences="20" value="ik_" /> + <ngram occurrences="20" value="eg" /> + <ngram occurrences="20" value="_l" /> + <ngram occurrences="20" value="_da" /> + <ngram occurrences="19" value="si" /> + <ngram occurrences="19" value="on" /> + <ngram occurrences="19" value="nd" /> + <ngram occurrences="19" value="li" /> + <ngram occurrences="19" value="hi" /> + <ngram occurrences="19" value="_p" /> + <ngram occurrences="18" value="us" /> + <ngram occurrences="18" value="le" /> + <ngram occurrences="18" value="gi" /> + <ngram occurrences="18" value="eta_" /> + <ngram occurrences="18" value="du" /> + <ngram occurrences="18" value="ag" /> + <ngram occurrences="18" value="_o" /> + <ngram occurrences="17" value="zen_" /> + <ngram occurrences="17" value="il" /> + <ngram occurrences="17" value="ez_" /> + <ngram occurrences="17" value="au" /> + <ngram occurrences="17" value="ak_" /> + <ngram occurrences="16" value="ek" /> + <ngram occurrences="16" value="a_d" /> + <ngram occurrences="16" value="_m" /> + <ngram occurrences="16" value="_ez" /> + <ngram occurrences="16" value="_eta_" /> + <ngram occurrences="16" value="_eta" /> + <ngram occurrences="16" value="_et" /> + <ngram occurrences="15" value="ska" /> + <ngram occurrences="15" value="r_" /> + <ngram occurrences="15" value="ntz" /> + <ngram occurrences="15" value="ng" /> + <ngram occurrences="15" value="iko" /> + <ngram occurrences="15" value="ea" /> + <ngram occurrences="15" value="ati" /> + <ngram occurrences="15" value="ate" /> + <ngram occurrences="15" value="ab" /> + <ngram occurrences="15" value="_z" /> + <ngram occurrences="14" value="zt" /> + <ngram occurrences="14" value="uska" /> + <ngram occurrences="14" value="usk" /> + <ngram occurrences="14" value="tzen_" /> + <ngram occurrences="14" value="tzen" /> + <ngram occurrences="14" value="tza" /> + <ngram occurrences="14" value="tu_" /> + <ngram occurrences="14" value="tan_" /> + <ngram occurrences="14" value="tan" /> + <ngram occurrences="14" value="na_" /> + <ngram occurrences="14" value="ki" /> + <ngram occurrences="14" value="euska" /> + <ngram occurrences="14" value="eusk" /> + <ngram occurrences="14" value="eus" /> + <ngram occurrences="14" value="eu" /> + <ngram occurrences="14" value="en_d" /> + <ngram occurrences="14" value="egi" /> + <ngram occurrences="14" value="a_a" /> + <ngram occurrences="14" value="_ko" /> + <ngram occurrences="14" value="_eusk" /> + <ngram occurrences="14" value="_eus" /> + <ngram occurrences="14" value="_eu" /> + <ngram occurrences="13" value="zi" /> + <ngram occurrences="13" value="ren" /> + <ngram occurrences="13" value="os" /> + <ngram occurrences="13" value="ni" /> + <ngram occurrences="13" value="n_a" /> + <ngram occurrences="13" value="itz" /> + <ngram occurrences="13" value="is" /> + <ngram occurrences="13" value="ir" /> + <ngram occurrences="13" value="ika" /> + <ngram occurrences="13" value="id" /> + <ngram occurrences="13" value="f" /> + <ngram occurrences="13" value="ber" /> + <ngram occurrences="13" value="bat" /> + <ngram occurrences="13" value="_er" /> + <ngram occurrences="13" value="_bat" /> + <ngram occurrences="12" value="uz" /> + <ngram occurrences="12" value="ua" /> + <ngram occurrences="12" value="ot" /> + <ngram occurrences="12" value="no" /> + <ngram occurrences="12" value="ib" /> + <ngram occurrences="12" value="ga" /> + <ngram occurrences="12" value="ert" /> + <ngram occurrences="12" value="ere" /> + <ngram occurrences="12" value="ep" /> + <ngram occurrences="12" value="eh" /> + <ngram occurrences="12" value="bil" /> + <ngram occurrences="12" value="bai" /> + <ngram occurrences="12" value="atz" /> + <ngram occurrences="12" value="ara" /> + <ngram occurrences="12" value="am" /> + <ngram occurrences="12" value="ah" /> + <ngram occurrences="12" value="_u" /> + <ngram occurrences="12" value="_eg" /> + <ngram occurrences="12" value="_di" /> + <ngram occurrences="11" value="ste" /> + <ngram occurrences="11" value="pe" /> + <ngram occurrences="11" value="o_e" /> + <ngram occurrences="11" value="o_b" /> + <ngram occurrences="11" value="ne" /> + <ngram occurrences="11" value="n_b" /> + <ngram occurrences="11" value="mat" /> + <ngram occurrences="11" value="kal" /> + <ngram occurrences="11" value="ie" /> + <ngram occurrences="11" value="he" /> + <ngram occurrences="11" value="gu" /> + <ngram occurrences="11" value="ge" /> + <ngram occurrences="11" value="err" /> + <ngram occurrences="11" value="el" /> + <ngram occurrences="11" value="eko_" /> + <ngram occurrences="11" value="eko" /> + <ngram occurrences="11" value="do" /> + <ngram occurrences="11" value="da_" /> + <ngram occurrences="11" value="c" /> + <ngram occurrences="11" value="atik" /> + <ngram occurrences="11" value="at_" /> + <ngram occurrences="11" value="arr" /> + <ngram occurrences="11" value="an_e" /> + <ngram occurrences="11" value="ait" /> + <ngram occurrences="11" value="ain" /> + <ngram occurrences="11" value="_ha" /> + <ngram occurrences="10" value="ut" /> + <ngram occurrences="10" value="ue" /> + <ngram occurrences="10" value="te_" /> + <ngram occurrences="10" value="ren_" /> + <ngram occurrences="10" value="pa" /> + <ngram occurrences="10" value="oa_" /> + <ngram occurrences="10" value="ntze" /> + <ngram occurrences="10" value="mo" /> + <ngram occurrences="10" value="mati" /> + <ngram occurrences="10" value="ld" /> + <ngram occurrences="10" value="la_" /> + <ngram occurrences="10" value="ke_" /> + <ngram occurrences="10" value="k_e" /> + <ngram occurrences="10" value="in_" /> + <ngram occurrences="10" value="ia_" /> + <ngram occurrences="10" value="go_" /> + <ngram occurrences="10" value="e_b" /> + <ngram occurrences="10" value="atu" /> + <ngram occurrences="10" value="ari" /> + <ngram occurrences="10" value="ama" /> + <ngram occurrences="10" value="ald" /> + <ngram occurrences="10" value="ago" /> + <ngram occurrences="10" value="ad" /> + <ngram occurrences="10" value="abi" /> + <ngram occurrences="10" value="a_k" /> + <ngram occurrences="10" value="a_de" /> + <ngram occurrences="10" value="a_b" /> + <ngram occurrences="10" value="_t" /> + <ngram occurrences="10" value="_s" /> + <ngram occurrences="10" value="_na" /> + <ngram occurrences="10" value="_iz" /> + <ngram occurrences="10" value="_ber" /> + <ngram occurrences="9" value="zte" /> + <ngram occurrences="9" value="zko" /> + <ngram occurrences="9" value="zke" /> + <ngram occurrences="9" value="v" /> + <ngram occurrences="9" value="uk" /> + <ngram occurrences="9" value="ter" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="sa" /> + <ngram occurrences="9" value="s_" /> + <ngram occurrences="9" value="ru" /> + <ngram occurrences="9" value="rik_" /> + <ngram occurrences="9" value="rik" /> + <ngram occurrences="9" value="ria" /> + <ngram occurrences="9" value="ri_" /> + <ngram occurrences="9" value="raz" /> + <ngram occurrences="9" value="rabil" /> + <ngram occurrences="9" value="rabi" /> + <ngram occurrences="9" value="rab" /> + <ngram occurrences="9" value="ra_" /> + <ngram occurrences="9" value="mu" /> + <ngram occurrences="9" value="matik" /> + <ngram occurrences="9" value="kon" /> + <ngram occurrences="9" value="koa" /> + <ngram occurrences="9" value="ing" /> + <ngram occurrences="9" value="i_d" /> + <ngram occurrences="9" value="har" /> + <ngram occurrences="9" value="erri" /> + <ngram occurrences="9" value="erabi" /> + <ngram occurrences="9" value="erab" /> + <ngram occurrences="9" value="ena" /> + <ngram occurrences="9" value="ed" /> + <ngram occurrences="9" value="ea_" /> + <ngram occurrences="9" value="ala" /> + <ngram occurrences="9" value="ako" /> + <ngram occurrences="9" value="abil" /> + <ngram occurrences="9" value="_ze" /> + <ngram occurrences="9" value="_kon" /> + <ngram occurrences="9" value="_ge" /> + <ngram occurrences="9" value="_erab" /> + <ngram occurrences="9" value="_era" /> + <ngram occurrences="9" value="_egi" /> + <ngram occurrences="9" value="_du" /> + <ngram occurrences="9" value="_da_" /> + <ngram occurrences="8" value="zeptu" /> + <ngram occurrences="8" value="zept" /> + <ngram occurrences="8" value="zep" /> + <ngram occurrences="8" value="zen_d" /> + <ngram occurrences="8" value="zat" /> + <ngram occurrences="8" value="zan_" /> + <ngram occurrences="8" value="zan" /> + <ngram occurrences="8" value="uskal" /> + <ngram occurrences="8" value="tzept" /> + <ngram occurrences="8" value="tzep" /> + <ngram occurrences="8" value="ts" /> + <ngram occurrences="8" value="tiko" /> + <ngram occurrences="8" value="tika" /> + <ngram occurrences="8" value="ten_" /> + <ngram occurrences="8" value="ten" /> + <ngram occurrences="8" value="tat" /> + <ngram occurrences="8" value="skal" /> + <ngram occurrences="8" value="ro" /> + <ngram occurrences="8" value="ram" /> + <ngram occurrences="8" value="rak" /> + <ngram occurrences="8" value="ptu" /> + <ngram occurrences="8" value="pt" /> + <ngram occurrences="8" value="pen" /> + <ngram occurrences="8" value="orr" /> + <ngram occurrences="8" value="ontze" /> + <ngram occurrences="8" value="ontz" /> + <ngram occurrences="8" value="ont" /> + <ngram occurrences="8" value="ntzep" /> + <ngram occurrences="8" value="ndi" /> + <ngram occurrences="8" value="nah" /> + <ngram occurrences="8" value="lt" /> + <ngram occurrences="8" value="l_" /> + <ngram occurrences="8" value="kontz" /> + <ngram occurrences="8" value="kont" /> + <ngram occurrences="8" value="kar" /> + <ngram occurrences="8" value="izk" /> + <ngram occurrences="8" value="iza" /> + <ngram occurrences="8" value="itu" /> + <ngram occurrences="8" value="ita" /> + <ngram occurrences="8" value="ist" /> + <ngram occurrences="8" value="io" /> + <ngram occurrences="8" value="gram" /> + <ngram occurrences="8" value="gra" /> + <ngram occurrences="8" value="gr" /> + <ngram occurrences="8" value="ger" /> + <ngram occurrences="8" value="eza" /> + <ngram occurrences="8" value="est" /> + <ngram occurrences="8" value="eptu" /> + <ngram occurrences="8" value="ept" /> + <ngram occurrences="8" value="ena_" /> + <ngram occurrences="8" value="en_e" /> + <ngram occurrences="8" value="em" /> + <ngram occurrences="8" value="ela" /> + <ngram occurrences="8" value="azte" /> + <ngram occurrences="8" value="azt" /> + <ngram occurrences="8" value="atze" /> + <ngram occurrences="8" value="ar_" /> + <ngram occurrences="8" value="_kont" /> + <ngram occurrences="8" value="_hi" /> + <ngram occurrences="8" value="_gram" /> + <ngram occurrences="8" value="_gra" /> + <ngram occurrences="8" value="_gr" /> + <ngram occurrences="8" value="_ez_" /> + <ngram occurrences="8" value="_ed" /> + <ngram occurrences="8" value="_bi" /> + <ngram occurrences="8" value="_bai" /> + <ngram occurrences="8" value="_az" /> + <ngram occurrences="8" value="_a_" /> + <ngram occurrences="7" value="zu" /> + <ngram occurrences="7" value="zko_" /> + <ngram occurrences="7" value="z_d" /> + <ngram occurrences="7" value="und" /> + <ngram occurrences="7" value="tek" /> + <ngram occurrences="7" value="tak" /> + <ngram occurrences="7" value="res" /> + <ngram occurrences="7" value="re_" /> + <ngram occurrences="7" value="ramat" /> + <ngram occurrences="7" value="rama" /> + <ngram occurrences="7" value="pr" /> + <ngram occurrences="7" value="ok" /> + <ngram occurrences="7" value="o_h" /> + <ngram occurrences="7" value="o_a" /> + <ngram occurrences="7" value="nahi" /> + <ngram occurrences="7" value="lde" /> + <ngram occurrences="7" value="kat" /> + <ngram occurrences="7" value="k_b" /> + <ngram occurrences="7" value="j" /> + <ngram occurrences="7" value="izan_" /> + <ngram occurrences="7" value="izan" /> + <ngram occurrences="7" value="ite" /> + <ngram occurrences="7" value="int" /> + <ngram occurrences="7" value="iko_" /> + <ngram occurrences="7" value="ide" /> + <ngram occurrences="7" value="hiz" /> + <ngram occurrences="7" value="hi_" /> + <ngram occurrences="7" value="grama" /> + <ngram occurrences="7" value="ezk" /> + <ngram occurrences="7" value="en_a" /> + <ngram occurrences="7" value="edo" /> +</ngrams> diff --git a/src/plugins/language/belarus.klp b/src/plugins/language/belarus.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="596" value="_" /> + <ngram occurrences="541" value="à" /> + <ngram occurrences="249" value="í" /> + <ngram occurrences="189" value="i" /> + <ngram occurrences="183" value="ð" /> + <ngram occurrences="170" value="ê" /> + <ngram occurrences="159" value="å" /> + <ngram occurrences="156" value="ó" /> + <ngram occurrences="154" value="û" /> + <ngram occurrences="142" value="ë" /> + <ngram occurrences="128" value="ñ" /> + <ngram occurrences="126" value="à_" /> + <ngram occurrences="115" value="ò" /> + <ngram occurrences="111" value="ÿ" /> + <ngram occurrences="107" value="ì" /> + <ngram occurrences="99" value="â" /> + <ngram occurrences="97" value="ä" /> + <ngram occurrences="94" value="î" /> + <ngram occurrences="80" value="i_" /> + <ngram occurrences="76" value="ï" /> + <ngram occurrences="75" value="ö" /> + <ngram occurrences="75" value="ç" /> + <ngram occurrences="71" value="ó_" /> + <ngram occurrences="68" value="íà" /> + <ngram occurrences="65" value="êà" /> + <ngram occurrences="63" value="ã" /> + <ngram occurrences="58" value="_à" /> + <ngram occurrences="53" value="û_" /> + <ngram occurrences="53" value="àë" /> + <ngram occurrences="52" value="ðà" /> + <ngram occurrences="51" value="àð" /> + <ngram occurrences="49" value="ý" /> + <ngram occurrences="46" value="á" /> + <ngram occurrences="46" value="àí" /> + <ngram occurrences="45" value="âà" /> + <ngram occurrences="45" value="_ï" /> + <ngram occurrences="44" value="ÿ_" /> + <ngram occurrences="44" value="òà" /> + <ngram occurrences="40" value="_ó" /> + <ngram occurrences="39" value="_ñ" /> + <ngram occurrences="39" value="_ì" /> + <ngram occurrences="39" value="_â" /> + <ngram occurrences="36" value="ëà" /> + <ngram occurrences="36" value="é" /> + <ngram occurrences="36" value="å_" /> + <ngram occurrences="36" value="_í" /> + <ngram occurrences="34" value="ø" /> + <ngram occurrences="33" value="_i" /> + <ngram occurrences="32" value="ãà" /> + <ngram occurrences="32" value="_ã" /> + <ngram occurrences="31" value="ü" /> + <ngram occurrences="31" value="àä" /> + <ngram occurrences="30" value="ðû" /> + <ngram occurrences="29" value="íû" /> + <ngram occurrences="29" value="ëå" /> + <ngram occurrences="29" value="_ä" /> + <ngram occurrences="28" value="é_" /> + <ngram occurrences="28" value="_ê" /> + <ngram occurrences="27" value="íà_" /> + <ngram occurrences="27" value="_ó_" /> + <ngram occurrences="27" value="_á" /> + <ngram occurrences="26" value="òû" /> + <ngram occurrences="26" value="_ç" /> + <ngram occurrences="25" value="õ" /> + <ngram occurrences="25" value="ïà" /> + <ngram occurrences="25" value="ëi" /> + <ngram occurrences="25" value="çå" /> + <ngram occurrences="25" value="äà" /> + <ngram occurrences="24" value="ñê" /> + <ngram occurrences="24" value="ì_" /> + <ngram occurrences="24" value="êi" /> + <ngram occurrences="23" value="ðî" /> + <ngram occurrences="23" value="ïð" /> + <ngram occurrences="22" value="íi" /> + <ngram occurrences="22" value="åí" /> + <ngram occurrences="22" value="_i_" /> + <ngram occurrences="21" value="ñò" /> + <ngram occurrences="21" value="êó" /> + <ngram occurrences="21" value="çà" /> + <ngram occurrences="21" value="àì" /> + <ngram occurrences="21" value="àâ" /> + <ngram occurrences="20" value="àñ" /> + <ngram occurrences="20" value="àê" /> + <ngram occurrences="20" value="àé" /> + <ngram occurrences="20" value="_ïà" /> + <ngram occurrences="19" value="ìi" /> + <ngram occurrences="19" value="àç" /> + <ngram occurrences="19" value="iê" /> + <ngram occurrences="19" value="_íà" /> + <ngram occurrences="18" value="þ" /> + <ngram occurrences="18" value="ûÿ" /> + <ngram occurrences="18" value="î_" /> + <ngram occurrences="18" value="íñ" /> + <ngram occurrences="18" value="ìà" /> + <ngram occurrences="18" value="ëü" /> + <ngram occurrences="18" value="æ" /> + <ngram occurrences="18" value="äç" /> + <ngram occurrences="18" value="àó" /> + <ngram occurrences="18" value="àé_" /> + <ngram occurrences="18" value="àã" /> + <ngram occurrences="18" value="ií" /> + <ngram occurrences="17" value="õ_" /> + <ngram occurrences="17" value="íí" /> + <ngram occurrences="17" value="âå" /> + <ngram occurrences="17" value="àëå" /> + <ngram occurrences="17" value="à_ï" /> + <ngram occurrences="17" value="_ð" /> + <ngram occurrences="17" value="_ïð" /> + <ngram occurrences="16" value="öû" /> + <ngram occurrences="16" value="ñà" /> + <ngram occurrences="16" value="ðó" /> + <ngram occurrences="16" value="íÿ" /> + <ngram occurrences="16" value="íû_" /> + <ngram occurrences="16" value="íñê" /> + <ngram occurrences="16" value="ìå" /> + <ngram occurrences="16" value="åò" /> + <ngram occurrences="16" value="åð" /> + <ngram occurrences="15" value="ÿí" /> + <ngram occurrences="15" value="ü_" /> + <ngram occurrences="15" value="ûí" /> + <ngram occurrences="15" value="òàð" /> + <ngram occurrences="15" value="ð_" /> + <ngram occurrences="15" value="äçå" /> + <ngram occurrences="15" value="àëà" /> + <ngram occurrences="15" value="àâà" /> + <ngram occurrences="15" value="_êà" /> + <ngram occurrences="15" value="_ãà" /> + <ngram occurrences="14" value="ûì" /> + <ngram occurrences="14" value="ðý" /> + <ngram occurrences="14" value="íê" /> + <ngram occurrences="14" value="íå" /> + <ngram occurrences="14" value="ëÿ" /> + <ngram occurrences="14" value="àö" /> + <ngram occurrences="14" value="à_ó" /> + <ngram occurrences="14" value="_ÿ" /> + <ngram occurrences="13" value="öà" /> + <ngram occurrences="13" value="îí" /> + <ngram occurrences="13" value="êó_" /> + <ngram occurrences="13" value="êò" /> + <ngram occurrences="13" value="êi_" /> + <ngram occurrences="13" value="âi" /> + <ngram occurrences="13" value="àíà" /> + <ngram occurrences="13" value="à_ó_" /> + <ngram occurrences="13" value="à_ñ" /> + <ngram occurrences="12" value="ÿê" /> + <ngram occurrences="12" value="òð" /> + <ngram occurrences="12" value="òà_" /> + <ngram occurrences="12" value="ñêà" /> + <ngram occurrences="12" value="ñi" /> + <ngram occurrences="12" value="ðí" /> + <ngram occurrences="12" value="ëi_" /> + <ngram occurrences="12" value="êàë" /> + <ngram occurrences="12" value="êà_" /> + <ngram occurrences="12" value="ç_" /> + <ngram occurrences="12" value="åê" /> + <ngram occurrences="12" value="äà_" /> + <ngram occurrences="12" value="ãî" /> + <ngram occurrences="12" value="ãà_" /> + <ngram occurrences="12" value="àÿ_" /> + <ngram occurrences="12" value="àÿ" /> + <ngram occurrences="12" value="àò" /> + <ngram occurrences="12" value="àï" /> + <ngram occurrences="12" value="àãà_" /> + <ngram occurrences="12" value="àãà" /> + <ngram occurrences="12" value="ië" /> + <ngram occurrences="12" value="_ý" /> + <ngram occurrences="12" value="_ò" /> + <ngram occurrences="12" value="_çà" /> + <ngram occurrences="12" value="_âà" /> + <ngram occurrences="11" value="û_â" /> + <ngram occurrences="11" value="òû_" /> + <ngram occurrences="11" value="ñö" /> + <ngram occurrences="11" value="ñâ" /> + <ngram occurrences="11" value="ïðà" /> + <ngram occurrences="11" value="ïi" /> + <ngram occurrences="11" value="êî" /> + <ngram occurrences="11" value="åö" /> + <ngram occurrences="11" value="åë" /> + <ngram occurrences="11" value="âÿ" /> + <ngram occurrences="11" value="i_à" /> + <ngram occurrences="11" value="_íà_" /> + <ngram occurrences="11" value="_ç_" /> + <ngram occurrences="11" value="_å" /> + <ngram occurrences="10" value="ûì_" /> + <ngram occurrences="10" value="øû" /> + <ngram occurrences="10" value="öi" /> + <ngram occurrences="10" value="ñÿ" /> + <ngram occurrences="10" value="îó" /> + <ngram occurrences="10" value="îð" /> + <ngram occurrences="10" value="ëåê" /> + <ngram occurrences="10" value="è" /> + <ngram occurrences="10" value="äð" /> + <ngram occurrences="10" value="ãàçå" /> + <ngram occurrences="10" value="ãàç" /> + <ngram occurrences="10" value="âû" /> + <ngram occurrences="10" value="âàí" /> + <ngram occurrences="10" value="àðû" /> + <ngram occurrences="10" value="àðà" /> + <ngram occurrences="10" value="àçå" /> + <ngram occurrences="10" value="à_à" /> + <ngram occurrences="10" value="iêà" /> + <ngram occurrences="10" value="_ìi" /> + <ngram occurrences="10" value="_ãàçå" /> + <ngram occurrences="10" value="_ãàç" /> + <ngram occurrences="10" value="_âå" /> + <ngram occurrences="10" value="_àä" /> + <ngram occurrences="9" value="ûÿ_" /> + <ngram occurrences="9" value="öå" /> + <ngram occurrences="9" value="ô" /> + <ngram occurrences="9" value="óñ" /> + <ngram occurrences="9" value="óí" /> + <ngram occurrences="9" value="ó_ã" /> + <ngram occurrences="9" value="ó_à" /> + <ngram occurrences="9" value="ñòà" /> + <ngram occurrences="9" value="ðàä" /> + <ngram occurrences="9" value="îâ" /> + <ngram occurrences="9" value="íò" /> + <ngram occurrences="9" value="ëî" /> + <ngram occurrences="9" value="âàð" /> + <ngram occurrences="9" value="àð_" /> + <ngram occurrences="9" value="àëi" /> + <ngram occurrences="9" value="àâàí" /> + <ngram occurrences="9" value="_ìå" /> + <ngram occurrences="9" value="_äà" /> + <ngram occurrences="9" value="_àë" /> + <ngram occurrences="8" value="ÿ_à" /> + <ngram occurrences="8" value="ýë" /> + <ngram occurrences="8" value="ûê" /> + <ngram occurrences="8" value="ø_" /> + <ngram occurrences="8" value="öà_" /> + <ngram occurrences="8" value="óê" /> + <ngram occurrences="8" value="ó_í" /> + <ngram occurrences="8" value="ëà_" /> + <ngram occurrences="8" value="ê_" /> + <ngram occurrences="8" value="çå_" /> + <ngram occurrences="8" value="äçå_" /> + <ngram occurrences="8" value="ä_" /> + <ngram occurrences="8" value="áû" /> + <ngram occurrences="8" value="àó_" /> + <ngram occurrences="8" value="à_ó_ã" /> + <ngram occurrences="8" value="à_ïà" /> + <ngram occurrences="8" value="à_â" /> + <ngram occurrences="8" value="iì" /> + <ngram occurrences="8" value="i_ó" /> + <ngram occurrences="8" value="_û" /> + <ngram occurrences="8" value="_ø" /> + <ngram occurrences="8" value="_ô" /> + <ngram occurrences="8" value="_ó_ã" /> + <ngram occurrences="8" value="_ñâ" /> + <ngram occurrences="8" value="_ñà" /> + <ngram occurrences="8" value="_ïðà" /> + <ngram occurrences="8" value="_ìà" /> + <ngram occurrences="8" value="_ë" /> + <ngram occurrences="8" value="_åð" /> + <ngram occurrences="7" value="ýì" /> + <ngram occurrences="7" value="ýä" /> + <ngram occurrences="7" value="ûÿí" /> + <ngram occurrences="7" value="ûë" /> + <ngram occurrences="7" value="öå_" /> + <ngram occurrences="7" value="öi_" /> + <ngram occurrences="7" value="óð" /> + <ngram occurrences="7" value="óä" /> + <ngram occurrences="7" value="ó_ï" /> + <ngram occurrences="7" value="òû_â" /> + <ngram occurrences="7" value="òðî" /> + <ngram occurrences="7" value="ñàí" /> + <ngram occurrences="7" value="ðýä" /> + <ngram occurrences="7" value="ðîí" /> + <ngram occurrences="7" value="ðàí" /> + <ngram occurrences="7" value="ïðû" /> + <ngram occurrences="7" value="ïà_" /> + <ngram occurrences="7" value="íÿ_" /> + <ngram occurrences="7" value="íûÿ_" /> + <ngram occurrences="7" value="íûÿ" /> + <ngram occurrences="7" value="íî" /> + <ngram occurrences="7" value="íêà_" /> + <ngram occurrences="7" value="íêà" /> + <ngram occurrences="7" value="í_" /> + <ngram occurrences="7" value="ìï" /> + <ngram occurrences="7" value="ìií" /> + <ngram occurrences="7" value="ëÿ_" /> + <ngram occurrences="7" value="êòàð" /> + <ngram occurrences="7" value="êòà" /> + <ngram occurrences="7" value="êñ" /> + <ngram occurrences="7" value="êð" /> + <ngram occurrences="7" value="êàé_" /> + <ngram occurrences="7" value="êàé" /> + <ngram occurrences="7" value="çåò" /> + <ngram occurrences="7" value="åñ" /> + <ngram occurrences="7" value="åðí" /> + <ngram occurrences="7" value="äí" /> + <ngram occurrences="7" value="äàê" /> + <ngram occurrences="7" value="ãó" /> + <ngram occurrences="7" value="âàë" /> + <ngram occurrences="7" value="âà_" /> + <ngram occurrences="7" value="àø" /> + <ngram occurrences="7" value="àì_" /> + <ngram occurrences="7" value="àå" /> + <ngram occurrences="7" value="àäç" /> + <ngram occurrences="7" value="à_ã" /> + <ngram occurrences="7" value="ß" /> + <ngram occurrences="7" value="ið" /> + <ngram occurrences="7" value="_ýë" /> + <ngram occurrences="7" value="_ðý" /> + <ngram occurrences="7" value="_ïðû" /> + <ngram occurrences="7" value="_ïà_" /> + <ngram occurrences="7" value="_ìií" /> + <ngram occurrences="7" value="_êî" /> + <ngram occurrences="7" value="_êàë" /> + <ngram occurrences="7" value="_åðí" /> + <ngram occurrences="7" value="_âû" /> + <ngram occurrences="7" value="_âàð" /> + <ngram occurrences="7" value="_áû" /> + <ngram occurrences="7" value="_àê" /> + <ngram occurrences="7" value="_ß" /> + <ngram occurrences="6" value="ÿó_" /> + <ngram occurrences="6" value="ÿó" /> + <ngram occurrences="6" value="ÿíà" /> + <ngram occurrences="6" value="þ_" /> + <ngram occurrences="6" value="ýí" /> + <ngram occurrences="6" value="ýëåêò" /> + <ngram occurrences="6" value="ýëåê" /> + <ngram occurrences="6" value="ýëå" /> + <ngram occurrences="6" value="ýäàê" /> + <ngram occurrences="6" value="ýäà" /> + <ngram occurrences="6" value="üí" /> + <ngram occurrences="6" value="ûö" /> + <ngram occurrences="6" value="û_âå_" /> + <ngram occurrences="6" value="û_âå" /> + <ngram occurrences="6" value="øû_" /> + <ngram occurrences="6" value="öü_" /> + <ngram occurrences="6" value="öü" /> + <ngram occurrences="6" value="ööà_" /> + <ngram occurrences="6" value="ööà" /> + <ngram occurrences="6" value="öö" /> + <ngram occurrences="6" value="óíi" /> + <ngram occurrences="6" value="óë" /> + <ngram occurrences="6" value="óêó" /> + <ngram occurrences="6" value="òû_âå" /> + <ngram occurrences="6" value="òðîíí" /> + <ngram occurrences="6" value="òðîí" /> + <ngram occurrences="6" value="ðýäàê" /> + <ngram occurrences="6" value="ðýäà" /> + <ngram occurrences="6" value="ðûÿ" /> + <ngram occurrences="6" value="ðîíí" /> + <ngram occurrences="6" value="îíí" /> + <ngram occurrences="6" value="îæ" /> + <ngram occurrences="6" value="íòà_" /> + <ngram occurrences="6" value="íòà" /> + <ngram occurrences="6" value="íñêà" /> + <ngram occurrences="6" value="ííà" /> + <ngram occurrences="6" value="íå_" /> + <ngram occurrences="6" value="íàãà_" /> + <ngram occurrences="6" value="íàãà" /> + <ngram occurrences="6" value="íàã" /> + <ngram occurrences="6" value="íiê" /> + <ngram occurrences="6" value="íi_" /> + <ngram occurrences="6" value="ìïi" /> + <ngram occurrences="6" value="ìàë" /> + <ngram occurrences="6" value="ëüí" /> + <ngram occurrences="6" value="ëåêòð" /> + <ngram occurrences="6" value="ëåêò" /> + <ngram occurrences="6" value="êòðîí" /> + <ngram occurrences="6" value="êòðî" /> + <ngram occurrences="6" value="êòð" /> + <ngram occurrences="6" value="êàÿ_" /> + <ngram occurrences="6" value="êàÿ" /> + <ngram occurrences="6" value="é_ì" /> + <ngram occurrences="6" value="çåòû_" /> + <ngram occurrences="6" value="çåòû" /> + <ngram occurrences="6" value="åööà_" /> + <ngram occurrences="6" value="åööà" /> + <ngram occurrences="6" value="åöö" /> + <ngram occurrences="6" value="åòû_â" /> + <ngram occurrences="6" value="åòû_" /> + <ngram occurrences="6" value="åòû" /> + <ngram occurrences="6" value="åêòðî" /> + <ngram occurrences="6" value="åêòð" /> + <ngram occurrences="6" value="åêò" /> + <ngram occurrences="6" value="å_ì" /> + <ngram occurrences="6" value="å_åðí" /> + <ngram occurrences="6" value="å_åð" /> + <ngram occurrences="6" value="å_å" /> + <ngram occurrences="6" value="ãî_" /> + <ngram occurrences="6" value="ãàçåò" /> + <ngram occurrences="6" value="âå_åð" /> + <ngram occurrences="6" value="âå_å" /> + <ngram occurrences="6" value="âå_" /> + <ngram occurrences="6" value="âàðû" /> + <ngram occurrences="6" value="âàíà" /> + <ngram occurrences="6" value="áî" /> + <ngram occurrences="6" value="áåë" /> + <ngram occurrences="6" value="áå" /> + <ngram occurrences="6" value="àíí" /> + <ngram occurrences="6" value="àíà_" /> + <ngram occurrences="6" value="àêà" /> + <ngram occurrences="6" value="àçåòû" /> + <ngram occurrences="6" value="àçåò" /> + <ngram occurrences="6" value="àçà" /> + <ngram occurrences="6" value="àäà" /> +</ngrams> diff --git a/src/plugins/language/bosnian.klp b/src/plugins/language/bosnian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="845" value="_" /> + <ngram occurrences="518" value="a" /> + <ngram occurrences="391" value="e" /> + <ngram occurrences="365" value="i" /> + <ngram occurrences="340" value="o" /> + <ngram occurrences="277" value="n" /> + <ngram occurrences="266" value="j" /> + <ngram occurrences="218" value="a_" /> + <ngram occurrences="212" value="s" /> + <ngram occurrences="194" value="e_" /> + <ngram occurrences="185" value="u" /> + <ngram occurrences="175" value="r" /> + <ngram occurrences="157" value="d" /> + <ngram occurrences="146" value="je" /> + <ngram occurrences="138" value="k" /> + <ngram occurrences="131" value="t" /> + <ngram occurrences="128" value="m" /> + <ngram occurrences="126" value="v" /> + <ngram occurrences="122" value="l" /> + <ngram occurrences="119" value="p" /> + <ngram occurrences="112" value="i_" /> + <ngram occurrences="101" value="_s" /> + <ngram occurrences="100" value="c" /> + <ngram occurrences="94" value="u_" /> + <ngram occurrences="86" value="z" /> + <ngram occurrences="86" value="_n" /> + <ngram occurrences="82" value="na" /> + <ngram occurrences="81" value="_p" /> + <ngram occurrences="72" value="je_" /> + <ngram occurrences="71" value="b" /> + <ngram occurrences="69" value="o_" /> + <ngram occurrences="66" value="_i" /> + <ngram occurrences="64" value="g" /> + <ngram occurrences="62" value="_j" /> + <ngram occurrences="58" value="_d" /> + <ngram occurrences="55" value="_u" /> + <ngram occurrences="55" value="_je" /> + <ngram occurrences="52" value="ni" /> + <ngram occurrences="49" value="na_" /> + <ngram occurrences="48" value="ra" /> + <ngram occurrences="47" value="st" /> + <ngram occurrences="47" value="ij" /> + <ngram occurrences="45" value="oj" /> + <ngram occurrences="44" value="_o" /> + <ngram occurrences="43" value="no" /> + <ngram occurrences="42" value="ma" /> + <ngram occurrences="42" value="_je_" /> + <ngram occurrences="41" value="ko" /> + <ngram occurrences="41" value="en" /> + <ngram occurrences="41" value="_na" /> + <ngram occurrences="41" value="_k" /> + <ngram occurrences="40" value="la" /> + <ngram occurrences="38" value="ne" /> + <ngram occurrences="38" value="ka" /> + <ngram occurrences="38" value="an" /> + <ngram occurrences="37" value="pr" /> + <ngram occurrences="37" value="po" /> + <ngram occurrences="36" value="da" /> + <ngram occurrences="36" value="_m" /> + <ngram occurrences="36" value="_b" /> + <ngram occurrences="35" value="se" /> + <ngram occurrences="35" value="ci" /> + <ngram occurrences="35" value="_u_" /> + <ngram occurrences="34" value="vo" /> + <ngram occurrences="34" value="ja" /> + <ngram occurrences="33" value="al" /> + <ngram occurrences="33" value="_pr" /> + <ngram occurrences="33" value="_po" /> + <ngram occurrences="31" value="ri" /> + <ngram occurrences="31" value="re" /> + <ngram occurrences="31" value="_g" /> + <ngram occurrences="30" value="va" /> + <ngram occurrences="29" value="ti" /> + <ngram occurrences="29" value="ov" /> + <ngram occurrences="29" value="od" /> + <ngram occurrences="29" value="m_" /> + <ngram occurrences="29" value="h" /> + <ngram occurrences="29" value="_z" /> + <ngram occurrences="28" value="nj" /> + <ngram occurrences="28" value="e_s" /> + <ngram occurrences="28" value="am" /> + <ngram occurrences="28" value="a_j" /> + <ngram occurrences="27" value="ne_" /> + <ngram occurrences="27" value="a_s" /> + <ngram occurrences="27" value="_t" /> + <ngram occurrences="27" value="_i_" /> + <ngram occurrences="27" value="_a" /> + <ngram occurrences="26" value="os" /> + <ngram occurrences="26" value="om" /> + <ngram occurrences="26" value="la_" /> + <ngram occurrences="26" value="ji" /> + <ngram occurrences="26" value="_se" /> + <ngram occurrences="25" value="za" /> + <ngram occurrences="25" value="se_" /> + <ngram occurrences="25" value="ma_" /> + <ngram occurrences="25" value="ad" /> + <ngram occurrences="25" value="a_je" /> + <ngram occurrences="24" value="ro" /> + <ngram occurrences="24" value="e_p" /> + <ngram occurrences="24" value="dj" /> + <ngram occurrences="24" value="ba" /> + <ngram occurrences="23" value="vi" /> + <ngram occurrences="23" value="ta" /> + <ngram occurrences="23" value="li" /> + <ngram occurrences="23" value="ed" /> + <ngram occurrences="23" value="av" /> + <ngram occurrences="23" value="ar" /> + <ngram occurrences="23" value="ak" /> + <ngram occurrences="22" value="ob" /> + <ngram occurrences="22" value="in" /> + <ngram occurrences="22" value="ic" /> + <ngram occurrences="22" value="ev" /> + <ngram occurrences="22" value="e_i" /> + <ngram occurrences="22" value="dje" /> + <ngram occurrences="21" value="voj" /> + <ngram occurrences="21" value="le" /> + <ngram occurrences="21" value="im" /> + <ngram occurrences="21" value="ije" /> + <ngram occurrences="21" value="er" /> + <ngram occurrences="21" value="da_" /> + <ngram occurrences="21" value="d_" /> + <ngram occurrences="21" value="at" /> + <ngram occurrences="21" value="_se_" /> + <ngram occurrences="21" value="_r" /> + <ngram occurrences="20" value="us" /> + <ngram occurrences="20" value="jev" /> + <ngram occurrences="20" value="il" /> + <ngram occurrences="20" value="ih" /> + <ngram occurrences="20" value="go" /> + <ngram occurrences="20" value="di" /> + <ngram occurrences="20" value="ca" /> + <ngram occurrences="20" value="aj" /> + <ngram occurrences="20" value="a_p" /> + <ngram occurrences="20" value="a_n" /> + <ngram occurrences="20" value="a_je_" /> + <ngram occurrences="20" value="_na_" /> + <ngram occurrences="19" value="ju" /> + <ngram occurrences="19" value="iz" /> + <ngram occurrences="19" value="evo" /> + <ngram occurrences="19" value="e_n" /> + <ngram occurrences="19" value="djev" /> + <ngram occurrences="19" value="ac" /> + <ngram occurrences="19" value="_ko" /> + <ngram occurrences="19" value="_da" /> + <ngram occurrences="18" value="og" /> + <ngram occurrences="18" value="ke_" /> + <ngram occurrences="18" value="ke" /> + <ngram occurrences="18" value="jevoj" /> + <ngram occurrences="18" value="jevo" /> + <ngram occurrences="18" value="ih_" /> + <ngram occurrences="18" value="h_" /> + <ngram occurrences="18" value="evoj" /> + <ngram occurrences="18" value="djevo" /> + <ngram occurrences="18" value="_djev" /> + <ngram occurrences="18" value="_dje" /> + <ngram occurrences="18" value="_dj" /> + <ngram occurrences="17" value="ju_" /> + <ngram occurrences="17" value="is" /> + <ngram occurrences="17" value="es" /> + <ngram occurrences="17" value="ek" /> + <ngram occurrences="17" value="dn" /> + <ngram occurrences="17" value="ama_" /> + <ngram occurrences="17" value="ama" /> + <ngram occurrences="16" value="vojk" /> + <ngram occurrences="16" value="ve" /> + <ngram occurrences="16" value="u_n" /> + <ngram occurrences="16" value="te" /> + <ngram occurrences="16" value="su" /> + <ngram occurrences="16" value="sl" /> + <ngram occurrences="16" value="sa" /> + <ngram occurrences="16" value="or" /> + <ngram occurrences="16" value="om_" /> + <ngram occurrences="16" value="ojk" /> + <ngram occurrences="16" value="lj" /> + <ngram occurrences="16" value="jk" /> + <ngram occurrences="16" value="ja_" /> + <ngram occurrences="16" value="evojk" /> + <ngram occurrences="16" value="ce" /> + <ngram occurrences="16" value="_ka" /> + <ngram occurrences="15" value="ti_" /> + <ngram occurrences="15" value="on" /> + <ngram occurrences="15" value="n_" /> + <ngram occurrences="15" value="mu" /> + <ngram occurrences="15" value="ko_" /> + <ngram occurrences="15" value="it" /> + <ngram occurrences="15" value="ima" /> + <ngram occurrences="15" value="ija" /> + <ngram occurrences="15" value="ga" /> + <ngram occurrences="15" value="az" /> + <ngram occurrences="15" value="a_k" /> + <ngram occurrences="15" value="a_d" /> + <ngram occurrences="15" value="_v" /> + <ngram occurrences="15" value="_su" /> + <ngram occurrences="15" value="_od" /> + <ngram occurrences="15" value="_iz" /> + <ngram occurrences="15" value="_go" /> + <ngram occurrences="15" value="_ba" /> + <ngram occurrences="14" value="tr" /> + <ngram occurrences="14" value="su_" /> + <ngram occurrences="14" value="sk" /> + <ngram occurrences="14" value="jen" /> + <ngram occurrences="14" value="ik" /> + <ngram occurrences="14" value="i_n" /> + <ngram occurrences="14" value="cij" /> + <ngram occurrences="14" value="_su_" /> + <ngram occurrences="14" value="_da_" /> + <ngram occurrences="14" value="_c" /> + <ngram occurrences="14" value="_a_" /> + <ngram occurrences="13" value="za_" /> + <ngram occurrences="13" value="si" /> + <ngram occurrences="13" value="ru" /> + <ngram occurrences="13" value="pre" /> + <ngram occurrences="13" value="no_" /> + <ngram occurrences="13" value="me" /> + <ngram occurrences="13" value="ku" /> + <ngram occurrences="13" value="koj" /> + <ngram occurrences="13" value="e_u" /> + <ngram occurrences="13" value="e_pr" /> + <ngram occurrences="13" value="bi" /> + <ngram occurrences="13" value="bar" /> + <ngram occurrences="13" value="_za" /> + <ngram occurrences="13" value="_ni" /> + <ngram occurrences="13" value="_koj" /> + <ngram occurrences="12" value="zi" /> + <ngram occurrences="12" value="vojke" /> + <ngram occurrences="12" value="tu" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="ste" /> + <ngram occurrences="12" value="rij" /> + <ngram occurrences="12" value="ran" /> + <ngram occurrences="12" value="ojke_" /> + <ngram occurrences="12" value="ojke" /> + <ngram occurrences="12" value="od_" /> + <ngram occurrences="12" value="jke_" /> + <ngram occurrences="12" value="jke" /> + <ngram occurrences="12" value="ije_" /> + <ngram occurrences="12" value="i_p" /> + <ngram occurrences="12" value="ec" /> + <ngram occurrences="12" value="e_d" /> + <ngram occurrences="12" value="ati" /> + <ngram occurrences="12" value="aci" /> + <ngram occurrences="12" value="a_po" /> + <ngram occurrences="12" value="a_i" /> + <ngram occurrences="12" value="_pre" /> + <ngram occurrences="12" value="_ne" /> + <ngram occurrences="12" value="_mu" /> + <ngram occurrences="12" value="_bi" /> + <ngram occurrences="11" value="zn" /> + <ngram occurrences="11" value="ze" /> + <ngram occurrences="11" value="uc" /> + <ngram occurrences="11" value="sta" /> + <ngram occurrences="11" value="sp" /> + <ngram occurrences="11" value="rad" /> + <ngram occurrences="11" value="pro" /> + <ngram occurrences="11" value="pri" /> + <ngram occurrences="11" value="pa" /> + <ngram occurrences="11" value="ol" /> + <ngram occurrences="11" value="oji" /> + <ngram occurrences="11" value="oc" /> + <ngram occurrences="11" value="nje" /> + <ngram occurrences="11" value="nik" /> + <ngram occurrences="11" value="nam" /> + <ngram occurrences="11" value="lo" /> + <ngram occurrences="11" value="le_" /> + <ngram occurrences="11" value="k_" /> + <ngram occurrences="11" value="iv" /> + <ngram occurrences="11" value="ija_" /> + <ngram occurrences="11" value="i_s" /> + <ngram occurrences="11" value="el" /> + <ngram occurrences="11" value="e_na" /> + <ngram occurrences="11" value="do" /> + <ngram occurrences="11" value="ci_" /> + <ngram occurrences="11" value="ca_" /> + <ngram occurrences="11" value="a_o" /> + <ngram occurrences="11" value="a_m" /> + <ngram occurrences="11" value="_st" /> + <ngram occurrences="11" value="_sa" /> + <ngram occurrences="11" value="_ra" /> + <ngram occurrences="11" value="_od_" /> + <ngram occurrences="11" value="_nj" /> + <ngram occurrences="11" value="_do" /> + <ngram occurrences="10" value="u_r" /> + <ngram occurrences="10" value="s_" /> + <ngram occurrences="10" value="r_" /> + <ngram occurrences="10" value="oz" /> + <ngram occurrences="10" value="ost" /> + <ngram occurrences="10" value="o_je" /> + <ngram occurrences="10" value="o_j" /> + <ngram occurrences="10" value="ni_" /> + <ngram occurrences="10" value="na_k" /> + <ngram occurrences="10" value="mo" /> + <ngram occurrences="10" value="li_" /> + <ngram occurrences="10" value="ka_" /> + <ngram occurrences="10" value="ji_" /> + <ngram occurrences="10" value="jed" /> + <ngram occurrences="10" value="je_p" /> + <ngram occurrences="10" value="j_" /> + <ngram occurrences="10" value="ica" /> + <ngram occurrences="10" value="i_u" /> + <ngram occurrences="10" value="edn" /> + <ngram occurrences="10" value="e_u_" /> + <ngram occurrences="10" value="e_po" /> + <ngram occurrences="10" value="e_m" /> + <ngram occurrences="10" value="ce_" /> + <ngram occurrences="10" value="as" /> + <ngram occurrences="10" value="ali" /> + <ngram occurrences="10" value="a_u" /> + <ngram occurrences="10" value="_us" /> + <ngram occurrences="10" value="_tr" /> + <ngram occurrences="10" value="_pro" /> + <ngram occurrences="10" value="_pri" /> + <ngram occurrences="10" value="_im" /> + <ngram occurrences="10" value="_bar" /> + <ngram occurrences="9" value="zna" /> + <ngram occurrences="9" value="up" /> + <ngram occurrences="9" value="t_" /> + <ngram occurrences="9" value="sv" /> + <ngram occurrences="9" value="odi" /> + <ngram occurrences="9" value="o_je_" /> + <ngram occurrences="9" value="nu" /> + <ngram occurrences="9" value="io" /> + <ngram occurrences="9" value="gr" /> + <ngram occurrences="9" value="eri" /> + <ngram occurrences="9" value="de" /> + <ngram occurrences="9" value="cn" /> + <ngram occurrences="9" value="ava" /> + <ngram occurrences="9" value="ao_" /> + <ngram occurrences="9" value="ao" /> + <ngram occurrences="9" value="a_z" /> + <ngram occurrences="9" value="a_se" /> + <ngram occurrences="9" value="a_na" /> + <ngram occurrences="9" value="a_g" /> + <ngram occurrences="9" value="a_a" /> + <ngram occurrences="9" value="_no" /> + <ngram occurrences="9" value="_nam" /> + <ngram occurrences="9" value="_jed" /> + <ngram occurrences="9" value="_ima" /> + <ngram occurrences="8" value="vi_" /> + <ngram occurrences="8" value="ust" /> + <ngram occurrences="8" value="u_i" /> + <ngram occurrences="8" value="u_d" /> + <ngram occurrences="8" value="ter" /> + <ngram occurrences="8" value="sti" /> + <ngram occurrences="8" value="sn" /> + <ngram occurrences="8" value="se_p" /> + <ngram occurrences="8" value="ros" /> + <ngram occurrences="8" value="red" /> + <ngram occurrences="8" value="ova" /> + <ngram occurrences="8" value="noc" /> + <ngram occurrences="8" value="nij" /> + <ngram occurrences="8" value="mus" /> + <ngram occurrences="8" value="mi" /> + <ngram occurrences="8" value="lje" /> + <ngram occurrences="8" value="koji" /> + <ngram occurrences="8" value="jo" /> + <ngram occurrences="8" value="jih" /> + <ngram occurrences="8" value="je_i" /> + <ngram occurrences="8" value="ima_" /> + <ngram occurrences="8" value="ila_" /> + <ngram occurrences="8" value="ila" /> + <ngram occurrences="8" value="ika" /> + <ngram occurrences="8" value="i_i" /> + <ngram occurrences="8" value="gl" /> + <ngram occurrences="8" value="et" /> + <ngram occurrences="8" value="ena" /> + <ngram occurrences="8" value="e_z" /> + <ngram occurrences="8" value="e_su_" /> + <ngram occurrences="8" value="e_su" /> + <ngram occurrences="8" value="e_g" /> + <ngram occurrences="8" value="din" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="ala" /> + <ngram occurrences="8" value="ad_" /> + <ngram occurrences="8" value="a_koj" /> + <ngram occurrences="8" value="a_ko" /> + <ngram occurrences="8" value="a_b" /> + <ngram occurrences="8" value="_za_" /> + <ngram occurrences="8" value="_sv" /> + <ngram occurrences="8" value="_sl" /> + <ngram occurrences="8" value="_noc" /> + <ngram occurrences="8" value="_mus" /> + <ngram occurrences="8" value="_koji" /> + <ngram occurrences="8" value="_h" /> + <ngram occurrences="7" value="zd" /> + <ngram occurrences="7" value="z_" /> + <ngram occurrences="7" value="va_" /> + <ngram occurrences="7" value="uster" /> + <ngram occurrences="7" value="uste" /> + <ngram occurrences="7" value="un" /> + <ngram occurrences="7" value="ug" /> + <ngram occurrences="7" value="u_u_" /> + <ngram occurrences="7" value="u_u" /> + <ngram occurrences="7" value="u_s" /> + <ngram occurrences="7" value="u_na" /> + <ngram occurrences="7" value="tra" /> + <ngram occurrences="7" value="terij" /> + <ngram occurrences="7" value="teri" /> + <ngram occurrences="7" value="ta_" /> + <ngram occurrences="7" value="steri" /> + <ngram occurrences="7" value="ster" /> +</ngrams> diff --git a/src/plugins/language/breton.klp b/src/plugins/language/breton.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="915" value="_" /> + <ngram occurrences="494" value="e" /> + <ngram occurrences="448" value="a" /> + <ngram occurrences="265" value="n" /> + <ngram occurrences="253" value="o" /> + <ngram occurrences="235" value="r" /> + <ngram occurrences="164" value="t" /> + <ngram occurrences="152" value="u" /> + <ngram occurrences="139" value="i" /> + <ngram occurrences="137" value="l" /> + <ngram occurrences="137" value="h" /> + <ngram occurrences="131" value="a_" /> + <ngram occurrences="129" value="d" /> + <ngram occurrences="109" value="_a" /> + <ngram occurrences="106" value="r_" /> + <ngram occurrences="105" value="z" /> + <ngram occurrences="103" value="t_" /> + <ngram occurrences="103" value="m" /> + <ngram occurrences="101" value="_e" /> + <ngram occurrences="96" value="g" /> + <ngram occurrences="95" value="n_" /> + <ngram occurrences="95" value="e_" /> + <ngram occurrences="93" value="_h" /> + <ngram occurrences="86" value="s" /> + <ngram occurrences="77" value="v" /> + <ngram occurrences="77" value="k" /> + <ngram occurrences="73" value="an" /> + <ngram occurrences="73" value="_d" /> + <ngram occurrences="72" value="en" /> + <ngram occurrences="70" value="ou" /> + <ngram occurrences="68" value="b" /> + <ngram occurrences="64" value="c" /> + <ngram occurrences="60" value="et" /> + <ngram occurrences="59" value="p" /> + <ngram occurrences="57" value="_g" /> + <ngram occurrences="51" value="er" /> + <ngram occurrences="51" value="_m" /> + <ngram occurrences="50" value="oa" /> + <ngram occurrences="49" value="c_h" /> + <ngram occurrences="49" value="c_" /> + <ngram occurrences="49" value="ar" /> + <ngram occurrences="49" value="_o" /> + <ngram occurrences="48" value="et_" /> + <ngram occurrences="48" value="_p" /> + <ngram occurrences="47" value="ez" /> + <ngram occurrences="46" value="ur" /> + <ngram occurrences="42" value="_k" /> + <ngram occurrences="41" value="z_" /> + <ngram occurrences="38" value="ur_" /> + <ngram occurrences="38" value="l_" /> + <ngram occurrences="38" value="d_" /> + <ngram occurrences="38" value="_e_" /> + <ngram occurrences="38" value="_b" /> + <ngram occurrences="37" value="nn" /> + <ngram occurrences="37" value="ne" /> + <ngram occurrences="36" value="nt" /> + <ngram occurrences="36" value="_a_" /> + <ngram occurrences="35" value="ñ" /> + <ngram occurrences="35" value="ma" /> + <ngram occurrences="35" value="ha" /> + <ngram occurrences="34" value="s_" /> + <ngram occurrences="34" value="re" /> + <ngram occurrences="32" value="de" /> + <ngram occurrences="31" value="ra" /> + <ngram occurrences="31" value="nt_" /> + <ngram occurrences="31" value="ar_" /> + <ngram occurrences="31" value="_u" /> + <ngram occurrences="31" value="_c" /> + <ngram occurrences="30" value="h_" /> + <ngram occurrences="30" value="_l" /> + <ngram occurrences="29" value="_ha" /> + <ngram occurrences="28" value="ve" /> + <ngram occurrences="28" value="er_" /> + <ngram occurrences="28" value="enn" /> + <ngram occurrences="28" value="el" /> + <ngram occurrences="28" value="be" /> + <ngram occurrences="28" value="an_" /> + <ngram occurrences="28" value="_ma" /> + <ngram occurrences="27" value="ñ_" /> + <ngram occurrences="27" value="w" /> + <ngram occurrences="27" value="ho" /> + <ngram occurrences="27" value="ga" /> + <ngram occurrences="26" value="oa_" /> + <ngram occurrences="26" value="_v" /> + <ngram occurrences="26" value="_c_h" /> + <ngram occurrences="26" value="_c_" /> + <ngram occurrences="25" value="zh" /> + <ngram occurrences="25" value="o_" /> + <ngram occurrences="25" value="le" /> + <ngram occurrences="25" value="ke" /> + <ngram occurrences="25" value="he" /> + <ngram occurrences="25" value="eu" /> + <ngram occurrences="25" value="_n" /> + <ngram occurrences="24" value="pe" /> + <ngram occurrences="24" value="en_" /> + <ngram occurrences="24" value="añ" /> + <ngram occurrences="24" value="_oa" /> + <ngram occurrences="24" value="_ga" /> + <ngram occurrences="23" value="añ_" /> + <ngram occurrences="23" value="ant" /> + <ngram occurrences="23" value="ad" /> + <ngram occurrences="22" value="ù_" /> + <ngram occurrences="22" value="ù" /> + <ngram occurrences="22" value="où_" /> + <ngram occurrences="22" value="où" /> + <ngram occurrences="22" value="me" /> + <ngram occurrences="22" value="ll" /> + <ngram occurrences="22" value="ka" /> + <ngram occurrences="22" value="_r" /> + <ngram occurrences="22" value="_pe" /> + <ngram occurrences="22" value="_ar" /> + <ngram occurrences="21" value="us" /> + <ngram occurrences="21" value="ma_" /> + <ngram occurrences="21" value="la" /> + <ngram occurrences="21" value="da" /> + <ngram occurrences="21" value="al" /> + <ngram occurrences="21" value="_t" /> + <ngram occurrences="21" value="_ma_" /> + <ngram occurrences="21" value="_ho" /> + <ngram occurrences="21" value="_an" /> + <ngram occurrences="20" value="us_" /> + <ngram occurrences="20" value="in" /> + <ngram occurrences="20" value="gan" /> + <ngram occurrences="20" value="em" /> + <ngram occurrences="20" value="ant_" /> + <ngram occurrences="20" value="_oa_" /> + <ngram occurrences="20" value="_ar_" /> + <ngram occurrences="19" value="ro" /> + <ngram occurrences="19" value="our" /> + <ngram occurrences="19" value="na" /> + <ngram occurrences="19" value="g_" /> + <ngram occurrences="19" value="di" /> + <ngram occurrences="19" value="_ur_" /> + <ngram occurrences="19" value="_ur" /> + <ngram occurrences="19" value="_s" /> + <ngram occurrences="19" value="_gan" /> + <ngram occurrences="18" value="on" /> + <ngram occurrences="18" value="go" /> + <ngram occurrences="18" value="ez_" /> + <ngram occurrences="18" value="bo" /> + <ngram occurrences="18" value="ao" /> + <ngram occurrences="18" value="am" /> + <ngram occurrences="18" value="_ke" /> + <ngram occurrences="17" value="ze" /> + <ngram occurrences="17" value="ue" /> + <ngram occurrences="17" value="tr" /> + <ngram occurrences="17" value="t_a" /> + <ngram occurrences="17" value="ha_" /> + <ngram occurrences="17" value="ezh" /> + <ngram occurrences="17" value="ed" /> + <ngram occurrences="17" value="_ka" /> + <ngram occurrences="17" value="_ha_" /> + <ngram occurrences="17" value="_de" /> + <ngram occurrences="17" value="_be" /> + <ngram occurrences="16" value="vez" /> + <ngram occurrences="16" value="r_g" /> + <ngram occurrences="16" value="nn_" /> + <ngram occurrences="16" value="m_" /> + <ngram occurrences="16" value="eus_" /> + <ngram occurrences="16" value="eus" /> + <ngram occurrences="16" value="c_ho" /> + <ngram occurrences="16" value="ab" /> + <ngram occurrences="16" value="_ne" /> + <ngram occurrences="16" value="_di" /> + <ngram occurrences="16" value="_c_ho" /> + <ngram occurrences="15" value="hoa" /> + <ngram occurrences="15" value="gant" /> + <ngram occurrences="15" value="enn_" /> + <ngram occurrences="15" value="e_oa" /> + <ngram occurrences="15" value="e_o" /> + <ngram occurrences="15" value="c_h_" /> + <ngram occurrences="15" value="ae" /> + <ngram occurrences="15" value="_la" /> + <ngram occurrences="15" value="_hoa" /> + <ngram occurrences="15" value="_he" /> + <ngram occurrences="15" value="_h_" /> + <ngram occurrences="15" value="_da" /> + <ngram occurrences="14" value="ut" /> + <ngram occurrences="14" value="to" /> + <ngram occurrences="14" value="out" /> + <ngram occurrences="14" value="oue" /> + <ngram occurrences="14" value="n_e" /> + <ngram occurrences="14" value="iz" /> + <ngram occurrences="14" value="f" /> + <ngram occurrences="14" value="el_" /> + <ngram occurrences="14" value="ch" /> + <ngram occurrences="14" value="c_hoa" /> + <ngram occurrences="14" value="a_c" /> + <ngram occurrences="14" value="_gant" /> + <ngram occurrences="14" value="_eu" /> + <ngram occurrences="14" value="_an_" /> + <ngram occurrences="13" value="vi" /> + <ngram occurrences="13" value="un" /> + <ngram occurrences="13" value="t_e" /> + <ngram occurrences="13" value="k_" /> + <ngram occurrences="13" value="iv" /> + <ngram occurrences="13" value="ev" /> + <ngram occurrences="13" value="eg" /> + <ngram occurrences="13" value="ed_" /> + <ngram occurrences="13" value="e_oa_" /> + <ngram occurrences="13" value="bou" /> + <ngram occurrences="13" value="all" /> + <ngram occurrences="13" value="ad_" /> + <ngram occurrences="13" value="a_c_h" /> + <ngram occurrences="13" value="a_c_" /> + <ngram occurrences="13" value="_eus_" /> + <ngram occurrences="13" value="_eus" /> + <ngram occurrences="12" value="zh_" /> + <ngram occurrences="12" value="va" /> + <ngram occurrences="12" value="ta" /> + <ngram occurrences="12" value="st" /> + <ngram occurrences="12" value="ri" /> + <ngram occurrences="12" value="our_" /> + <ngram occurrences="12" value="no" /> + <ngram occurrences="12" value="ni" /> + <ngram occurrences="12" value="ne_" /> + <ngram occurrences="12" value="n_d" /> + <ngram occurrences="12" value="ll_" /> + <ngram occurrences="12" value="ket_" /> + <ngram occurrences="12" value="ket" /> + <ngram occurrences="12" value="gw" /> + <ngram occurrences="12" value="gant_" /> + <ngram occurrences="12" value="es" /> + <ngram occurrences="12" value="e_d" /> + <ngram occurrences="12" value="a_o" /> + <ngram occurrences="12" value="a_m" /> + <ngram occurrences="12" value="_me" /> + <ngram occurrences="12" value="_go" /> + <ngram occurrences="11" value="z_e" /> + <ngram occurrences="11" value="we" /> + <ngram occurrences="11" value="vo" /> + <ngram occurrences="11" value="ut_" /> + <ngram occurrences="11" value="tra" /> + <ngram occurrences="11" value="r_e" /> + <ngram occurrences="11" value="out_" /> + <ngram occurrences="11" value="oar" /> + <ngram occurrences="11" value="n_a" /> + <ngram occurrences="11" value="is" /> + <ngram occurrences="11" value="in_" /> + <ngram occurrences="11" value="i_" /> + <ngram occurrences="11" value="ge" /> + <ngram occurrences="11" value="ec" /> + <ngram occurrences="11" value="da_" /> + <ngram occurrences="11" value="d_a" /> + <ngram occurrences="11" value="ber" /> + <ngram occurrences="11" value="av" /> + <ngram occurrences="11" value="aou" /> + <ngram occurrences="11" value="ag" /> + <ngram occurrences="11" value="abou" /> + <ngram occurrences="11" value="abo" /> + <ngram occurrences="11" value="_w" /> + <ngram occurrences="11" value="_i" /> + <ngram occurrences="11" value="_gw" /> + <ngram occurrences="11" value="_em" /> + <ngram occurrences="11" value="_da_" /> + <ngram occurrences="10" value="vez_" /> + <ngram occurrences="10" value="te" /> + <ngram occurrences="10" value="t_d" /> + <ngram occurrences="10" value="sk" /> + <ngram occurrences="10" value="oz" /> + <ngram occurrences="10" value="oc" /> + <ngram occurrences="10" value="li" /> + <ngram occurrences="10" value="labou" /> + <ngram occurrences="10" value="labo" /> + <ngram occurrences="10" value="lab" /> + <ngram occurrences="10" value="ko" /> + <ngram occurrences="10" value="io" /> + <ngram occurrences="10" value="hi" /> + <ngram occurrences="10" value="gou" /> + <ngram occurrences="10" value="bour" /> + <ngram occurrences="10" value="abour" /> + <ngram occurrences="10" value="a_r" /> + <ngram occurrences="10" value="_z" /> + <ngram occurrences="10" value="_ket_" /> + <ngram occurrences="10" value="_ket" /> + <ngram occurrences="10" value="_f" /> + <ngram occurrences="10" value="_en" /> + <ngram occurrences="10" value="_d_" /> + <ngram occurrences="10" value="_am" /> + <ngram occurrences="9" value="za" /> + <ngram occurrences="9" value="t_p" /> + <ngram occurrences="9" value="t_k" /> + <ngram occurrences="9" value="t_a_" /> + <ngram occurrences="9" value="re_" /> + <ngram occurrences="9" value="ra_" /> + <ngram occurrences="9" value="r_p" /> + <ngram occurrences="9" value="pa" /> + <ngram occurrences="9" value="oz_" /> + <ngram occurrences="9" value="l_l" /> + <ngram occurrences="9" value="iz_" /> + <ngram occurrences="9" value="il" /> + <ngram occurrences="9" value="hoar" /> + <ngram occurrences="9" value="etr" /> + <ngram occurrences="9" value="ent" /> + <ngram occurrences="9" value="e_v" /> + <ngram occurrences="9" value="bet_" /> + <ngram occurrences="9" value="bet" /> + <ngram occurrences="9" value="ba" /> + <ngram occurrences="9" value="ann" /> + <ngram occurrences="9" value="a_v" /> + <ngram occurrences="9" value="a_oa" /> + <ngram occurrences="9" value="a_ma" /> + <ngram occurrences="9" value="a_d" /> + <ngram occurrences="9" value="a_a" /> + <ngram occurrences="9" value="_un" /> + <ngram occurrences="9" value="_ra" /> + <ngram occurrences="9" value="_o_" /> + <ngram occurrences="9" value="_ne_" /> + <ngram occurrences="9" value="_labo" /> + <ngram occurrences="9" value="_lab" /> + <ngram occurrences="9" value="_hoar" /> + <ngram occurrences="9" value="_ev" /> + <ngram occurrences="9" value="_en_" /> + <ngram occurrences="9" value="_bet_" /> + <ngram occurrences="9" value="_bet" /> + <ngram occurrences="9" value="_a_r" /> + <ngram occurrences="8" value="ñ_e" /> + <ngram occurrences="8" value="z_a" /> + <ngram occurrences="8" value="wa" /> + <ngram occurrences="8" value="ul" /> + <ngram occurrences="8" value="tra_" /> + <ngram occurrences="8" value="rez" /> + <ngram occurrences="8" value="pr" /> + <ngram occurrences="8" value="petra" /> + <ngram occurrences="8" value="petr" /> + <ngram occurrences="8" value="pet" /> + <ngram occurrences="8" value="ober_" /> + <ngram occurrences="8" value="ober" /> + <ngram occurrences="8" value="obe" /> + <ngram occurrences="8" value="ob" /> + <ngram occurrences="8" value="nna" /> + <ngram occurrences="8" value="j" /> + <ngram occurrences="8" value="ive" /> + <ngram occurrences="8" value="ie" /> + <ngram occurrences="8" value="g_a" /> + <ngram occurrences="8" value="etra_" /> + <ngram occurrences="8" value="etra" /> + <ngram occurrences="8" value="eo" /> + <ngram occurrences="8" value="ent_" /> + <ngram occurrences="8" value="eme" /> + <ngram occurrences="8" value="eg_" /> + <ngram occurrences="8" value="ec_h" /> + <ngram occurrences="8" value="ec_" /> + <ngram occurrences="8" value="do" /> + <ngram occurrences="8" value="che" /> + <ngram occurrences="8" value="br" /> + <ngram occurrences="8" value="bour_" /> + <ngram occurrences="8" value="ber_" /> + <ngram occurrences="8" value="at" /> + <ngram occurrences="8" value="as" /> + <ngram occurrences="8" value="ade" /> + <ngram occurrences="8" value="a_ra" /> + <ngram occurrences="8" value="_vo" /> + <ngram occurrences="8" value="_pr" /> + <ngram occurrences="8" value="_petr" /> + <ngram occurrences="8" value="_pet" /> + <ngram occurrences="8" value="_ober" /> + <ngram occurrences="8" value="_obe" /> + <ngram occurrences="8" value="_ob" /> + <ngram occurrences="8" value="_hi" /> + <ngram occurrences="8" value="_gou" /> + <ngram occurrences="8" value="_e_oa" /> + <ngram occurrences="8" value="_e_o" /> + <ngram occurrences="7" value="y" /> + <ngram occurrences="7" value="un_" /> + <ngram occurrences="7" value="u_" /> + <ngram occurrences="7" value="t_e_" /> + <ngram occurrences="7" value="so" /> + <ngram occurrences="7" value="se" /> + <ngram occurrences="7" value="s_a" /> + <ngram occurrences="7" value="rv" /> + <ngram occurrences="7" value="r_s" /> + <ngram occurrences="7" value="r_h" /> + <ngram occurrences="7" value="r_b" /> + <ngram occurrences="7" value="r_a" /> + <ngram occurrences="7" value="pl" /> + <ngram occurrences="7" value="or" /> + <ngram occurrences="7" value="on_" /> + <ngram occurrences="7" value="nt_a" /> + <ngram occurrences="7" value="n_t" /> + <ngram occurrences="7" value="n_h" /> + <ngram occurrences="7" value="mz" /> + <ngram occurrences="7" value="mo" /> + <ngram occurrences="7" value="met" /> + <ngram occurrences="7" value="lu" /> + <ngram occurrences="7" value="ivez_" /> + <ngram occurrences="7" value="ivez" /> + <ngram occurrences="7" value="it" /> + <ngram occurrences="7" value="hag_" /> + <ngram occurrences="7" value="hag" /> + <ngram occurrences="7" value="ezh_" /> + <ngram occurrences="7" value="et_k" /> + <ngram occurrences="7" value="et_e" /> + <ngram occurrences="7" value="er_g" /> + <ngram occurrences="7" value="ell" /> + <ngram occurrences="7" value="ek" /> + <ngram occurrences="7" value="ec_h_" /> + <ngram occurrences="7" value="e_m" /> + <ngram occurrences="7" value="e_g" /> + <ngram occurrences="7" value="dr" /> +</ngrams> diff --git a/src/plugins/language/bulgarian.klp b/src/plugins/language/bulgarian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="802" value="_" /> + <ngram occurrences="468" value="ð" /> + <ngram occurrences="391" value="ø" /> + <ngram occurrences="352" value="þ" /> + <ngram occurrences="343" value="õ" /> + <ngram occurrences="335" value="â" /> + <ngram occurrences="297" value="ý" /> + <ngram occurrences="241" value="á" /> + <ngram occurrences="218" value="à" /> + <ngram occurrences="201" value="ð_" /> + <ngram occurrences="171" value="ò" /> + <ngram occurrences="161" value="ú" /> + <ngram occurrences="137" value="ø_" /> + <ngram occurrences="114" value="õ_" /> + <ngram occurrences="112" value="þ_" /> + <ngram occurrences="111" value="ß" /> + <ngram occurrences="103" value="ô" /> + <ngram occurrences="101" value="û" /> + <ngram occurrences="95" value="ýð" /> + <ngram occurrences="92" value="_á" /> + <ngram occurrences="84" value="_ý" /> + <ngram occurrences="81" value="áâ" /> + <ngram occurrences="74" value="ýø" /> + <ngram occurrences="74" value="ï" /> + <ngram occurrences="72" value="_ß" /> + <ngram occurrences="71" value="ýð_" /> + <ngram occurrences="70" value="ü" /> + <ngram occurrences="69" value="_ø" /> + <ngram occurrences="68" value="âõ" /> + <ngram occurrences="63" value="àð" /> + <ngram occurrences="60" value="ó" /> + <ngram occurrences="60" value="_ýð" /> + <ngram occurrences="56" value="ñ" /> + <ngram occurrences="56" value="âþ" /> + <ngram occurrences="53" value="ê" /> + <ngram occurrences="53" value="â_" /> + <ngram occurrences="52" value="ç" /> + <ngram occurrences="49" value="âð" /> + <ngram occurrences="49" value="_ò" /> + <ngram occurrences="47" value="ðâ" /> + <ngram occurrences="47" value="_ýð_" /> + <ngram occurrences="46" value="þâ" /> + <ngram occurrences="46" value="øâ" /> + <ngram occurrences="46" value="_ú" /> + <ngram occurrences="45" value="_ð" /> + <ngram occurrences="44" value="õý" /> + <ngram occurrences="44" value="ã" /> + <ngram occurrences="44" value="_þ" /> + <ngram occurrences="43" value="ðý" /> + <ngram occurrences="42" value="àõ" /> + <ngram occurrences="41" value="âþ_" /> + <ngram occurrences="41" value="ßà" /> + <ngram occurrences="40" value="òð" /> + <ngram occurrences="39" value="þá" /> + <ngram occurrences="39" value="ýþ" /> + <ngram occurrences="39" value="úþ" /> + <ngram occurrences="39" value="øâõ" /> + <ngram occurrences="39" value="àø" /> + <ngram occurrences="39" value="_ô" /> + <ngram occurrences="39" value="_à" /> + <ngram occurrences="36" value="ßþ" /> + <ngram occurrences="36" value="_õ" /> + <ngram occurrences="34" value="ï_" /> + <ngram occurrences="34" value="_ßà" /> + <ngram occurrences="33" value="õâ" /> + <ngram occurrences="33" value="àþ" /> + <ngram occurrences="32" value="úð" /> + <ngram occurrences="31" value="_ø_" /> + <ngram occurrences="30" value="ýø_" /> + <ngram occurrences="30" value="âø" /> + <ngram occurrences="30" value="âõ_" /> + <ngram occurrences="29" value="øï" /> + <ngram occurrences="28" value="ýõ" /> + <ngram occurrences="28" value="øâõ_" /> + <ngram occurrences="28" value="ôð" /> + <ngram occurrences="28" value="ò_" /> + <ngram occurrences="28" value="ðò" /> + <ngram occurrences="28" value="âð_" /> + <ngram occurrences="28" value="áõ" /> + <ngram occurrences="28" value="_ßþ" /> + <ngram occurrences="27" value="_ü" /> + <ngram occurrences="26" value="øï_" /> + <ngram occurrences="26" value="ðú" /> + <ngram occurrences="26" value="ä" /> + <ngram occurrences="25" value="ðà" /> + <ngram occurrences="25" value="ð_á" /> + <ngram occurrences="25" value="áú" /> + <ngram occurrences="25" value="_â" /> + <ngram occurrences="25" value="_áõ" /> + <ngram occurrences="24" value="ûø" /> + <ngram occurrences="24" value="øú" /> + <ngram occurrences="24" value="õá" /> + <ngram occurrences="24" value="õà" /> + <ngram occurrences="24" value="ð_ß" /> + <ngram occurrences="23" value="øý" /> + <ngram occurrences="23" value="õô" /> + <ngram occurrences="23" value="õ_ø" /> + <ngram occurrences="23" value="òõ" /> + <ngram occurrences="23" value="_ñ" /> + <ngram occurrences="22" value="áõ_" /> + <ngram occurrences="22" value="_þâ" /> + <ngram occurrences="22" value="_áõ_" /> + <ngram occurrences="21" value="ö" /> + <ngram occurrences="21" value="òþ" /> + <ngram occurrences="21" value="_ôð" /> + <ngram occurrences="20" value="þáâ" /> + <ngram occurrences="20" value="ø_ø" /> + <ngram occurrences="20" value="ôð_" /> + <ngram occurrences="20" value="ðâ_" /> + <ngram occurrences="20" value="è" /> + <ngram occurrences="19" value="þó" /> + <ngram occurrences="19" value="úø" /> + <ngram occurrences="19" value="õ_ý" /> + <ngram occurrences="19" value="ðýø" /> + <ngram occurrences="19" value="é" /> + <ngram occurrences="19" value="æ" /> + <ngram occurrences="19" value="âò" /> + <ngram occurrences="19" value="_ò_" /> + <ngram occurrences="18" value="þ_á" /> + <ngram occurrences="18" value="ýøâõ" /> + <ngram occurrences="18" value="ýøâ" /> + <ngram occurrences="18" value="õû" /> + <ngram occurrences="18" value="ð_ú" /> + <ngram occurrences="18" value="âý" /> + <ngram occurrences="18" value="_õ_" /> + <ngram occurrences="18" value="_ôð_" /> + <ngram occurrences="18" value="_ó" /> + <ngram occurrences="17" value="ýþ_" /> + <ngram occurrences="17" value="ýøâõ_" /> + <ngram occurrences="17" value="ýâ" /> + <ngram occurrences="17" value="ú_" /> + <ngram occurrences="17" value="øá" /> + <ngram occurrences="17" value="òø" /> + <ngram occurrences="17" value="_ð_" /> + <ngram occurrences="16" value="þ_ý" /> + <ngram occurrences="16" value="ýá" /> + <ngram occurrences="16" value="ûý" /> + <ngram occurrences="16" value="ûõ" /> + <ngram occurrences="16" value="øú_" /> + <ngram occurrences="16" value="òð_" /> + <ngram occurrences="16" value="ðâð" /> + <ngram occurrences="16" value="ð_ð" /> + <ngram occurrences="16" value="áø" /> + <ngram occurrences="16" value="áâò" /> + <ngram occurrences="16" value="_àð" /> + <ngram occurrences="15" value="þñ" /> + <ngram occurrences="15" value="üþ" /> + <ngram occurrences="15" value="üø" /> + <ngram occurrences="15" value="û_" /> + <ngram occurrences="15" value="úþ_" /> + <ngram occurrences="15" value="ù" /> + <ngram occurrences="15" value="øç" /> + <ngram occurrences="15" value="øà" /> + <ngram occurrences="15" value="õâþ" /> + <ngram occurrences="15" value="õ_þ" /> + <ngram occurrences="15" value="õ_ýð" /> + <ngram occurrences="15" value="ôþ" /> + <ngram occurrences="15" value="óð" /> + <ngram occurrences="15" value="áê" /> + <ngram occurrences="15" value="á_" /> + <ngram occurrences="15" value="_ýõ" /> + <ngram occurrences="15" value="_àõ" /> + <ngram occurrences="14" value="þô" /> + <ngram occurrences="14" value="ûð" /> + <ngram occurrences="14" value="øò" /> + <ngram occurrences="14" value="õâþ_" /> + <ngram occurrences="14" value="õáâ" /> + <ngram occurrences="14" value="õ_ýð_" /> + <ngram occurrences="14" value="ð_ò" /> + <ngram occurrences="14" value="ð_à" /> + <ngram occurrences="14" value="å" /> + <ngram occurrences="14" value="áû" /> + <ngram occurrences="14" value="ßàõ" /> + <ngram occurrences="13" value="þò" /> + <ngram occurrences="13" value="ý_" /> + <ngram occurrences="13" value="üõ" /> + <ngram occurrences="13" value="øàð" /> + <ngram occurrences="13" value="ø_ý" /> + <ngram occurrences="13" value="ø_ß" /> + <ngram occurrences="13" value="õýø" /> + <ngram occurrences="13" value="ôø" /> + <ngram occurrences="13" value="ôõ" /> + <ngram occurrences="13" value="ñð" /> + <ngram occurrences="13" value="ðâð_" /> + <ngram occurrences="13" value="çø" /> + <ngram occurrences="13" value="æø" /> + <ngram occurrences="13" value="áúø" /> + <ngram occurrences="13" value="áð" /> + <ngram occurrences="13" value="áâõ" /> + <ngram occurrences="13" value="àðý" /> + <ngram occurrences="13" value="àð_" /> + <ngram occurrences="13" value="ßàþ" /> + <ngram occurrences="13" value="_úþ" /> + <ngram occurrences="12" value="½" /> + <ngram occurrences="12" value="þû" /> + <ngram occurrences="12" value="þà" /> + <ngram occurrences="12" value="þß" /> + <ngram occurrences="12" value="þ_ß" /> + <ngram occurrences="12" value="ýð_á" /> + <ngram occurrences="12" value="úðâ" /> + <ngram occurrences="12" value="úâ" /> + <ngram occurrences="12" value="øü" /> + <ngram occurrences="12" value="ðúâ" /> + <ngram occurrences="12" value="ðä" /> + <ngram occurrences="12" value="ðá" /> + <ngram occurrences="12" value="ð_ßà" /> + <ngram occurrences="12" value="çõ" /> + <ngram occurrences="12" value="âõà" /> + <ngram occurrences="12" value="ßþá" /> + <ngram occurrences="12" value="_½" /> + <ngram occurrences="12" value="_úð" /> + <ngram occurrences="12" value="_ç" /> + <ngram occurrences="12" value="_ßàõ" /> + <ngram occurrences="11" value="þâþ" /> + <ngram occurrences="11" value="ýõ_" /> + <ngram occurrences="11" value="ûø_" /> + <ngram occurrences="11" value="úø_" /> + <ngram occurrences="11" value="úê" /> + <ngram occurrences="11" value="úà" /> + <ngram occurrences="11" value="òï" /> + <ngram occurrences="11" value="ðýõ" /> + <ngram occurrences="11" value="ðû" /> + <ngram occurrences="11" value="ðàø" /> + <ngram occurrences="11" value="ð_ý" /> + <ngram occurrences="11" value="áâð" /> + <ngram occurrences="11" value="àõ_" /> + <ngram occurrences="11" value="_ñð" /> + <ngram occurrences="11" value="_ã" /> + <ngram occurrences="11" value="_á_" /> + <ngram occurrences="10" value="þâþ_" /> + <ngram occurrences="10" value="þâ_" /> + <ngram occurrences="10" value="þ_ýð" /> + <ngram occurrences="10" value="ýþá" /> + <ngram occurrences="10" value="ûðò" /> + <ngram occurrences="10" value="úð_" /> + <ngram occurrences="10" value="øýð" /> + <ngram occurrences="10" value="øõ" /> + <ngram occurrences="10" value="øâõû" /> + <ngram occurrences="10" value="øáâ" /> + <ngram occurrences="10" value="ø_â" /> + <ngram occurrences="10" value="õûý" /> + <ngram occurrences="10" value="õò" /> + <ngram occurrences="10" value="õàø" /> + <ngram occurrences="10" value="óþ" /> + <ngram occurrences="10" value="óà" /> + <ngram occurrences="10" value="ñþ" /> + <ngram occurrences="10" value="ñø" /> + <ngram occurrences="10" value="ðòï" /> + <ngram occurrences="10" value="ð_ô" /> + <ngram occurrences="10" value="ð_àõ" /> + <ngram occurrences="10" value="çý" /> + <ngram occurrences="10" value="âõý" /> + <ngram occurrences="10" value="âõû" /> + <ngram occurrences="10" value="áò" /> + <ngram occurrences="10" value="áâõý" /> + <ngram occurrences="10" value="ßàø" /> + <ngram occurrences="10" value="_þâ_" /> + <ngram occurrences="10" value="_üþ" /> + <ngram occurrences="10" value="_ôþ" /> + <ngram occurrences="10" value="_áê" /> + <ngram occurrences="10" value="_áâ" /> + <ngram occurrences="10" value="_ßàþ" /> + <ngram occurrences="10" value="_ßàø" /> + <ngram occurrences="9" value="þù" /> + <ngram occurrences="9" value="þ_ø" /> + <ngram occurrences="9" value="ýøï_" /> + <ngram occurrences="9" value="ýøï" /> + <ngram occurrences="9" value="ýð_ð" /> + <ngram occurrences="9" value="ýð_ß" /> + <ngram occurrences="9" value="ûýø" /> + <ngram occurrences="9" value="úâõàø" /> + <ngram occurrences="9" value="úâõà" /> + <ngram occurrences="9" value="úâõ" /> + <ngram occurrences="9" value="øû" /> + <ngram occurrences="9" value="øõ_" /> + <ngram occurrences="9" value="øâõûý" /> + <ngram occurrences="9" value="ø_ýð" /> + <ngram occurrences="9" value="ø_ô" /> + <ngram occurrences="9" value="õýâ" /> + <ngram occurrences="9" value="ôð_á" /> + <ngram occurrences="9" value="ô_" /> + <ngram occurrences="9" value="óàð" /> + <ngram occurrences="9" value="òðý" /> + <ngram occurrences="9" value="òðâ" /> + <ngram occurrences="9" value="ñðúâõ" /> + <ngram occurrences="9" value="ñðúâ" /> + <ngram occurrences="9" value="ñðú" /> + <ngram occurrences="9" value="ðýø_" /> + <ngram occurrences="9" value="ðúâõà" /> + <ngram occurrences="9" value="ðúâõ" /> + <ngram occurrences="9" value="ðß" /> + <ngram occurrences="9" value="ð_ð_" /> + <ngram occurrences="9" value="ð_áõ_" /> + <ngram occurrences="9" value="ð_áõ" /> + <ngram occurrences="9" value="çð" /> + <ngram occurrences="9" value="ãá" /> + <ngram occurrences="9" value="âþ_á" /> + <ngram occurrences="9" value="âýþ" /> + <ngram occurrences="9" value="âõûý" /> + <ngram occurrences="9" value="âõàø" /> + <ngram occurrences="9" value="áõ_þ" /> + <ngram occurrences="9" value="áâþ" /> + <ngram occurrences="9" value="_øá" /> + <ngram occurrences="9" value="_áõ_þ" /> + <ngram occurrences="9" value="_áð" /> + <ngram occurrences="8" value="¸" /> + <ngram occurrences="8" value="þ_ò" /> + <ngram occurrences="8" value="þ_ð" /> + <ngram occurrences="8" value="þ_áõ" /> + <ngram occurrences="8" value="ýþáâ" /> + <ngram occurrences="8" value="ü_" /> + <ngram occurrences="8" value="øø" /> + <ngram occurrences="8" value="øáâõ" /> + <ngram occurrences="8" value="ø_ú" /> + <ngram occurrences="8" value="ø_á" /> + <ngram occurrences="8" value="õú" /> + <ngram occurrences="8" value="õâø" /> + <ngram occurrences="8" value="õ_á" /> + <ngram occurrences="8" value="õ_ß" /> + <ngram occurrences="8" value="òðâ_" /> + <ngram occurrences="8" value="òê" /> + <ngram occurrences="8" value="ðô" /> + <ngram occurrences="8" value="ðñ" /> + <ngram occurrences="8" value="ðâþ" /> + <ngram occurrences="8" value="ð_ü" /> + <ngram occurrences="8" value="ð_ñ" /> + <ngram occurrences="8" value="ïâ" /> + <ngram occurrences="8" value="éõ" /> + <ngram occurrences="8" value="èð" /> + <ngram occurrences="8" value="âà" /> + <ngram occurrences="8" value="â_ý" /> + <ngram occurrences="8" value="áûðò" /> + <ngram occurrences="8" value="áûð" /> + <ngram occurrences="8" value="áâø" /> + <ngram occurrences="8" value="áâ_" /> + <ngram occurrences="8" value="àø_" /> + <ngram occurrences="8" value="àðâ" /> + <ngram occurrences="8" value="ßð" /> + <ngram occurrences="8" value="_¸" /> + <ngram occurrences="8" value="_ýð_á" /> + <ngram occurrences="8" value="_úê" /> + <ngram occurrences="8" value="_øú" /> + <ngram occurrences="8" value="_øáâ" /> + <ngram occurrences="8" value="_õô" /> + <ngram occurrences="8" value="_õ_ø" /> + <ngram occurrences="8" value="_ôð_á" /> + <ngram occurrences="8" value="_òð" /> + <ngram occurrences="8" value="_è" /> + <ngram occurrences="8" value="_àõ_" /> + <ngram occurrences="7" value="þý" /> + <ngram occurrences="7" value="þ_ýð_" /> + <ngram occurrences="7" value="þ_õ" /> + <ngram occurrences="7" value="ýï" /> + <ngram occurrences="7" value="ýâý" /> + <ngram occurrences="7" value="ýáú" /> + <ngram occurrences="7" value="ýáâ" /> + <ngram occurrences="7" value="üð" /> + <ngram occurrences="7" value="ûðòïý" /> + <ngram occurrences="7" value="ûðòï" /> + <ngram occurrences="7" value="øø_" /> + <ngram occurrences="7" value="øáâõý" /> + <ngram occurrences="7" value="ø_ü" /> + <ngram occurrences="7" value="ø_ø_" /> + <ngram occurrences="7" value="ø_ò" /> + <ngram occurrences="7" value="öý" /> + <ngram occurrences="7" value="õýâý" /> + <ngram occurrences="7" value="õý_" /> + <ngram occurrences="7" value="õü" /> + <ngram occurrences="7" value="õ_øáâ" /> + <ngram occurrences="7" value="õ_øá" /> + <ngram occurrences="7" value="ôð_áõ" /> + <ngram occurrences="7" value="óû" /> + <ngram occurrences="7" value="óðà" /> + <ngram occurrences="7" value="òþ_" /> + <ngram occurrences="7" value="òðýõ" /> + <ngram occurrences="7" value="òïýáú" /> + <ngram occurrences="7" value="òïýá" /> + <ngram occurrences="7" value="òïý" /> + <ngram occurrences="7" value="ðòð" /> + <ngram occurrences="7" value="ðòïýá" /> + <ngram occurrences="7" value="ðòïý" /> + <ngram occurrences="7" value="ð_þ" /> + <ngram occurrences="7" value="ð_ýð" /> + <ngram occurrences="7" value="ð_ó" /> + <ngram occurrences="7" value="ð_àõ_" /> + <ngram occurrences="7" value="ð_ßþ" /> + <ngram occurrences="7" value="ïýáú" /> + <ngram occurrences="7" value="ïýá" /> + <ngram occurrences="7" value="ïý" /> + <ngram occurrences="7" value="ïòð" /> + <ngram occurrences="7" value="ïò" /> + <ngram occurrences="7" value="êû" /> + <ngram occurrences="7" value="éð" /> + <ngram occurrences="7" value="èðä" /> + <ngram occurrences="7" value="äø" /> + <ngram occurrences="7" value="äð" /> + <ngram occurrences="7" value="âýø" /> + <ngram occurrences="7" value="âú" /> + <ngram occurrences="7" value="âõýâý" /> + <ngram occurrences="7" value="âõýâ" /> +</ngrams> diff --git a/src/plugins/language/catalan.klp b/src/plugins/language/catalan.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="620" value="_" /> + <ngram occurrences="385" value="e" /> + <ngram occurrences="383" value="a" /> + <ngram occurrences="213" value="r" /> + <ngram occurrences="210" value="s" /> + <ngram occurrences="206" value="l" /> + <ngram occurrences="193" value="i" /> + <ngram occurrences="183" value="t" /> + <ngram occurrences="183" value="n" /> + <ngram occurrences="157" value="o" /> + <ngram occurrences="141" value="c" /> + <ngram occurrences="135" value="d" /> + <ngram occurrences="130" value="a_" /> + <ngram occurrences="126" value="u" /> + <ngram occurrences="108" value="s_" /> + <ngram occurrences="91" value="_d" /> + <ngram occurrences="87" value="p" /> + <ngram occurrences="87" value="m" /> + <ngram occurrences="86" value="e_" /> + <ngram occurrences="81" value="de" /> + <ngram occurrences="76" value="_de" /> + <ngram occurrences="71" value="es" /> + <ngram occurrences="70" value="l_" /> + <ngram occurrences="69" value="_l" /> + <ngram occurrences="68" value="_e" /> + <ngram occurrences="61" value="_a" /> + <ngram occurrences="54" value="_c" /> + <ngram occurrences="52" value="en" /> + <ngram occurrences="50" value="de_" /> + <ngram occurrences="50" value="_de_" /> + <ngram occurrences="47" value="_p" /> + <ngram occurrences="46" value="ta" /> + <ngram occurrences="46" value="el" /> + <ngram occurrences="44" value="la" /> + <ngram occurrences="43" value="ra" /> + <ngram occurrences="41" value="re" /> + <ngram occurrences="39" value="t_" /> + <ngram occurrences="39" value="an" /> + <ngram occurrences="38" value="er" /> + <ngram occurrences="38" value="ar" /> + <ngram occurrences="37" value="_la" /> + <ngram occurrences="36" value="es_" /> + <ngram occurrences="36" value="at" /> + <ngram occurrences="35" value="ci" /> + <ngram occurrences="34" value="n_" /> + <ngram occurrences="34" value="co" /> + <ngram occurrences="34" value="al" /> + <ngram occurrences="33" value="v" /> + <ngram occurrences="33" value="on" /> + <ngram occurrences="33" value="na" /> + <ngram occurrences="33" value="g" /> + <ngram occurrences="32" value="ue" /> + <ngram occurrences="32" value="_m" /> + <ngram occurrences="31" value="se" /> + <ngram occurrences="31" value="nt" /> + <ngram occurrences="31" value="_s" /> + <ngram occurrences="30" value="b" /> + <ngram occurrences="29" value="qu" /> + <ngram occurrences="29" value="q" /> + <ngram occurrences="29" value="la_" /> + <ngram occurrences="28" value="_la_" /> + <ngram occurrences="27" value="que" /> + <ngram occurrences="27" value="el_" /> + <ngram occurrences="26" value="st" /> + <ngram occurrences="26" value="or" /> + <ngram occurrences="26" value="e_l" /> + <ngram occurrences="25" value="s_d" /> + <ngram occurrences="25" value="r_" /> + <ngram occurrences="25" value="o_" /> + <ngram occurrences="25" value="_co" /> + <ngram occurrences="24" value="f" /> + <ngram occurrences="23" value="it" /> + <ngram occurrences="23" value="_t" /> + <ngram occurrences="23" value="_i" /> + <ngram occurrences="22" value="te" /> + <ngram occurrences="22" value="ac" /> + <ngram occurrences="22" value="_el" /> + <ngram occurrences="21" value="ur" /> + <ngram occurrences="21" value="ro" /> + <ngram occurrences="21" value="pr" /> + <ngram occurrences="21" value="me" /> + <ngram occurrences="21" value="i_" /> + <ngram occurrences="21" value="as" /> + <ngram occurrences="20" value="un" /> + <ngram occurrences="20" value="s_de" /> + <ngram occurrences="20" value="le" /> + <ngram occurrences="20" value="e_la" /> + <ngram occurrences="20" value="ca" /> + <ngram occurrences="19" value="à" /> + <ngram occurrences="19" value="ll" /> + <ngram occurrences="19" value="est" /> + <ngram occurrences="19" value="_se" /> + <ngram occurrences="18" value="ó" /> + <ngram occurrences="18" value="ma" /> + <ngram occurrences="18" value="ic" /> + <ngram occurrences="18" value="gu" /> + <ngram occurrences="18" value="de_l" /> + <ngram occurrences="18" value="_qu" /> + <ngram occurrences="18" value="_q" /> + <ngram occurrences="18" value="_de_l" /> + <ngram occurrences="17" value="tr" /> + <ngram occurrences="17" value="ti" /> + <ngram occurrences="17" value="pa" /> + <ngram occurrences="17" value="os" /> + <ngram occurrences="17" value="en_" /> + <ngram occurrences="17" value="e_la_" /> + <ngram occurrences="17" value="at_" /> + <ngram occurrences="17" value="a_d" /> + <ngram occurrences="17" value="_es" /> + <ngram occurrences="17" value="_el_" /> + <ngram occurrences="16" value="y" /> + <ngram occurrences="16" value="ue_" /> + <ngram occurrences="16" value="que_" /> + <ngram occurrences="16" value="pe" /> + <ngram occurrences="16" value="ns" /> + <ngram occurrences="16" value="li" /> + <ngram occurrences="16" value="ent" /> + <ngram occurrences="16" value="a_e" /> + <ngram occurrences="16" value="a_de" /> + <ngram occurrences="16" value="_que_" /> + <ngram occurrences="16" value="_que" /> + <ngram occurrences="16" value="_l_" /> + <ngram occurrences="15" value="ri" /> + <ngram occurrences="15" value="na_" /> + <ngram occurrences="15" value="mi" /> + <ngram occurrences="15" value="ia" /> + <ngram occurrences="15" value="as_" /> + <ngram occurrences="15" value="al_" /> + <ngram occurrences="15" value="_f" /> + <ngram occurrences="15" value="_en" /> + <ngram occurrences="14" value="va" /> + <ngram occurrences="14" value="sta" /> + <ngram occurrences="14" value="s_de_" /> + <ngram occurrences="14" value="ra_" /> + <ngram occurrences="14" value="po" /> + <ngram occurrences="14" value="in" /> + <ngram occurrences="14" value="de_la" /> + <ngram occurrences="14" value="da" /> + <ngram occurrences="14" value="aci" /> + <ngram occurrences="14" value="a_l" /> + <ngram occurrences="14" value="_pr" /> + <ngram occurrences="13" value="ne" /> + <ngram occurrences="13" value="io" /> + <ngram occurrences="13" value="ec" /> + <ngram occurrences="13" value="del" /> + <ngram occurrences="13" value="_v" /> + <ngram occurrences="13" value="_u" /> + <ngram occurrences="13" value="_del" /> + <ngram occurrences="12" value="ó_" /> + <ngram occurrences="12" value="à_" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="ta_" /> + <ngram occurrences="12" value="s_e" /> + <ngram occurrences="12" value="per" /> + <ngram occurrences="12" value="om" /> + <ngram occurrences="12" value="nt_" /> + <ngram occurrences="12" value="ni" /> + <ngram occurrences="12" value="ls_" /> + <ngram occurrences="12" value="ls" /> + <ngram occurrences="12" value="l_d" /> + <ngram occurrences="12" value="l_a" /> + <ngram occurrences="12" value="ió" /> + <ngram occurrences="12" value="ir" /> + <ngram occurrences="12" value="h" /> + <ngram occurrences="12" value="e_c" /> + <ngram occurrences="12" value="do" /> + <ngram occurrences="12" value="am" /> + <ngram occurrences="12" value="ad" /> + <ngram occurrences="12" value="_i_" /> + <ngram occurrences="12" value="_en_" /> + <ngram occurrences="12" value="_a_" /> + <ngram occurrences="11" value="y_" /> + <ngram occurrences="11" value="x" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="ues" /> + <ngram occurrences="11" value="os_" /> + <ngram occurrences="11" value="ona" /> + <ngram occurrences="11" value="ol" /> + <ngram occurrences="11" value="men" /> + <ngram occurrences="11" value="ió_" /> + <ngram occurrences="11" value="ion" /> + <ngram occurrences="11" value="ie" /> + <ngram occurrences="11" value="ia_" /> + <ngram occurrences="11" value="esta" /> + <ngram occurrences="11" value="di" /> + <ngram occurrences="11" value="de_c" /> + <ngram occurrences="11" value="cu" /> + <ngram occurrences="11" value="ció" /> + <ngram occurrences="11" value="a_c" /> + <ngram occurrences="11" value="_r" /> + <ngram occurrences="11" value="_de_c" /> + <ngram occurrences="10" value="z" /> + <ngram occurrences="10" value="ura" /> + <ngram occurrences="10" value="ran" /> + <ngram occurrences="10" value="no" /> + <ngram occurrences="10" value="nd" /> + <ngram occurrences="10" value="es_d" /> + <ngram occurrences="10" value="e_a" /> + <ngram occurrences="10" value="ct" /> + <ngram occurrences="10" value="con" /> + <ngram occurrences="10" value="ció_" /> + <ngram occurrences="10" value="ació" /> + <ngram occurrences="10" value="_un" /> + <ngram occurrences="10" value="_re" /> + <ngram occurrences="10" value="_pe" /> + <ngram occurrences="10" value="_n" /> + <ngram occurrences="10" value="_al" /> + <ngram occurrences="9" value="s_c" /> + <ngram occurrences="9" value="rt" /> + <ngram occurrences="9" value="rs" /> + <ngram occurrences="9" value="res" /> + <ngram occurrences="9" value="rd" /> + <ngram occurrences="9" value="ques" /> + <ngram occurrences="9" value="pre" /> + <ngram occurrences="9" value="ons" /> + <ngram occurrences="9" value="nc" /> + <ngram occurrences="9" value="les" /> + <ngram occurrences="9" value="l_de" /> + <ngram occurrences="9" value="j" /> + <ngram occurrences="9" value="ep" /> + <ngram occurrences="9" value="ent_" /> + <ngram occurrences="9" value="em" /> + <ngram occurrences="9" value="des" /> + <ngram occurrences="9" value="del_" /> + <ngram occurrences="9" value="da_" /> + <ngram occurrences="9" value="com" /> + <ngram occurrences="9" value="ació_" /> + <ngram occurrences="9" value="a_m" /> + <ngram occurrences="9" value="_po" /> + <ngram occurrences="9" value="_ma" /> + <ngram occurrences="9" value="_del_" /> + <ngram occurrences="9" value="_com" /> + <ngram occurrences="9" value="_ca" /> + <ngram occurrences="8" value="va_" /> + <ngram occurrences="8" value="us" /> + <ngram occurrences="8" value="uest" /> + <ngram occurrences="8" value="tu" /> + <ngram occurrences="8" value="tiv" /> + <ngram occurrences="8" value="t_de" /> + <ngram occurrences="8" value="t_d" /> + <ngram occurrences="8" value="t_a" /> + <ngram occurrences="8" value="so" /> + <ngram occurrences="8" value="si" /> + <ngram occurrences="8" value="s_p" /> + <ngram occurrences="8" value="rn" /> + <ngram occurrences="8" value="nal" /> + <ngram occurrences="8" value="ment" /> + <ngram occurrences="8" value="les_" /> + <ngram occurrences="8" value="las_" /> + <ngram occurrences="8" value="las" /> + <ngram occurrences="8" value="iv" /> + <ngram occurrences="8" value="im" /> + <ngram occurrences="8" value="il" /> + <ngram occurrences="8" value="fi" /> + <ngram occurrences="8" value="eu" /> + <ngram occurrences="8" value="er_" /> + <ngram occurrences="8" value="ell" /> + <ngram occurrences="8" value="eg" /> + <ngram occurrences="8" value="ea" /> + <ngram occurrences="8" value="d_" /> + <ngram occurrences="8" value="cr" /> + <ngram occurrences="8" value="cio" /> + <ngram occurrences="8" value="cia" /> + <ngram occurrences="8" value="ara" /> + <ngram occurrences="8" value="a_t" /> + <ngram occurrences="8" value="a_s" /> + <ngram occurrences="8" value="a_qu" /> + <ngram occurrences="8" value="a_q" /> + <ngram occurrences="8" value="a_de_" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_y" /> + <ngram occurrences="8" value="_pa" /> + <ngram occurrences="8" value="_l_a" /> + <ngram occurrences="8" value="_in" /> + <ngram occurrences="8" value="_h" /> + <ngram occurrences="8" value="_g" /> + <ngram occurrences="7" value="é" /> + <ngram occurrences="7" value="ura_" /> + <ngram occurrences="7" value="ul" /> + <ngram occurrences="7" value="tat" /> + <ngram occurrences="7" value="tas" /> + <ngram occurrences="7" value="sta_" /> + <ngram occurrences="7" value="s_i" /> + <ngram occurrences="7" value="s_f" /> + <ngram occurrences="7" value="ra_de" /> + <ngram occurrences="7" value="ra_d" /> + <ngram occurrences="7" value="quest" /> + <ngram occurrences="7" value="pro" /> + <ngram occurrences="7" value="par" /> + <ngram occurrences="7" value="oc" /> + <ngram occurrences="7" value="nta" /> + <ngram occurrences="7" value="nda" /> + <ngram occurrences="7" value="n_l" /> + <ngram occurrences="7" value="mp" /> + <ngram occurrences="7" value="ment_" /> + <ngram occurrences="7" value="l_e" /> + <ngram occurrences="7" value="l_de_" /> + <ngram occurrences="7" value="ita" /> + <ngram occurrences="7" value="iona" /> + <ngram occurrences="7" value="ha" /> + <ngram occurrences="7" value="et" /> + <ngram occurrences="7" value="es_de" /> + <ngram occurrences="7" value="era" /> + <ngram occurrences="7" value="els_" /> + <ngram occurrences="7" value="els" /> + <ngram occurrences="7" value="e_co" /> + <ngram occurrences="7" value="cor" /> + <ngram occurrences="7" value="cion" /> + <ngram occurrences="7" value="ba" /> + <ngram occurrences="7" value="ar_" /> + <ngram occurrences="7" value="aques" /> + <ngram occurrences="7" value="aque" /> + <ngram occurrences="7" value="aqu" /> + <ngram occurrences="7" value="aq" /> + <ngram occurrences="7" value="ant" /> + <ngram occurrences="7" value="and" /> + <ngram occurrences="7" value="ana" /> + <ngram occurrences="7" value="a_p" /> + <ngram occurrences="7" value="_ta" /> + <ngram occurrences="7" value="_per" /> + <ngram occurrences="7" value="_mi" /> + <ngram occurrences="7" value="_las_" /> + <ngram occurrences="7" value="_las" /> + <ngram occurrences="7" value="_fi" /> + <ngram occurrences="7" value="_des" /> + <ngram occurrences="7" value="_con" /> + <ngram occurrences="7" value="_aque" /> + <ngram occurrences="7" value="_aqu" /> + <ngram occurrences="7" value="_aq" /> + <ngram occurrences="7" value="_al_" /> + <ngram occurrences="6" value="í" /> + <ngram occurrences="6" value="ve" /> + <ngram occurrences="6" value="una_" /> + <ngram occurrences="6" value="una" /> + <ngram occurrences="6" value="ui" /> + <ngram occurrences="6" value="ua" /> + <ngram occurrences="6" value="tura_" /> + <ngram occurrences="6" value="tura" /> + <ngram occurrences="6" value="tur" /> + <ngram occurrences="6" value="ter" /> + <ngram occurrences="6" value="te_" /> + <ngram occurrences="6" value="tat_" /> + <ngram occurrences="6" value="tas_" /> + <ngram occurrences="6" value="tar" /> + <ngram occurrences="6" value="tam" /> + <ngram occurrences="6" value="t_de_" /> + <ngram occurrences="6" value="s_v" /> + <ngram occurrences="6" value="rà_" /> + <ngram occurrences="6" value="rà" /> + <ngram occurrences="6" value="ron" /> + <ngram occurrences="6" value="rne" /> + <ngram occurrences="6" value="rep" /> + <ngram occurrences="6" value="rec" /> + <ngram occurrences="6" value="rea" /> + <ngram occurrences="6" value="rac" /> + <ngram occurrences="6" value="para" /> + <ngram occurrences="6" value="ot" /> + <ngram occurrences="6" value="onal" /> + <ngram occurrences="6" value="ncia" /> + <ngram occurrences="6" value="nci" /> + <ngram occurrences="6" value="n_e" /> + <ngram occurrences="6" value="mar" /> + <ngram occurrences="6" value="m_" /> + <ngram occurrences="6" value="lt" /> + <ngram occurrences="6" value="lo" /> + <ngram occurrences="6" value="lle" /> + <ngram occurrences="6" value="ll_" /> + <ngram occurrences="6" value="l_p" /> + <ngram occurrences="6" value="l_c" /> + <ngram occurrences="6" value="ite" /> + <ngram occurrences="6" value="ir_" /> + <ngram occurrences="6" value="ional" /> + <ngram occurrences="6" value="ici" /> + <ngram occurrences="6" value="fa" /> + <ngram occurrences="6" value="en_e" /> + <ngram occurrences="6" value="el_p" /> + <ngram occurrences="6" value="ed" /> + <ngram occurrences="6" value="ect" /> + <ngram occurrences="6" value="e_p" /> + <ngram occurrences="6" value="de_co" /> + <ngram occurrences="6" value="cons" /> + <ngram occurrences="6" value="cia_" /> + <ngram occurrences="6" value="cat" /> + <ngram occurrences="6" value="ativ" /> + <ngram occurrences="6" value="ati" /> + <ngram occurrences="6" value="ana_" /> + <ngram occurrences="6" value="an_" /> + <ngram occurrences="6" value="a_que" /> + <ngram occurrences="6" value="a_la" /> + <ngram occurrences="6" value="a_l_" /> + <ngram occurrences="6" value="_y_" /> + <ngram occurrences="6" value="_una_" /> + <ngram occurrences="6" value="_una" /> + <ngram occurrences="6" value="_tr" /> + <ngram occurrences="6" value="_pre" /> + <ngram occurrences="6" value="_o" /> + <ngram occurrences="6" value="_no" /> + <ngram occurrences="6" value="_le" /> + <ngram occurrences="6" value="_ha" /> + <ngram occurrences="6" value="_es_" /> +</ngrams> diff --git a/src/plugins/language/chinese.klp b/src/plugins/language/chinese.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1385" value="_" /> + <ngram occurrences="178" value="¨" /> + <ngram occurrences="158" value="_¨" /> + <ngram occurrences="103" value="¸" /> + <ngram occurrences="92" value="_¸" /> + <ngram occurrences="76" value="ª" /> + <ngram occurrences="69" value="m" /> + <ngram occurrences="68" value="m_" /> + <ngram occurrences="64" value="_ª" /> + <ngram occurrences="64" value="_m_" /> + <ngram occurrences="64" value="_m" /> + <ngram occurrences="63" value="³" /> + <ngram occurrences="59" value="q" /> + <ngram occurrences="55" value="º" /> + <ngram occurrences="55" value="q_" /> + <ngram occurrences="54" value="½" /> + <ngram occurrences="50" value="¹" /> + <ngram occurrences="47" value="ó" /> + <ngram occurrences="47" value="ä" /> + <ngram occurrences="47" value="_½" /> + <ngram occurrences="46" value="µ" /> + <ngram occurrences="44" value="ó_" /> + <ngram occurrences="44" value="_³" /> + <ngram occurrences="43" value="¨_" /> + <ngram occurrences="41" value="à" /> + <ngram occurrences="39" value="²" /> + <ngram occurrences="38" value="ÿ" /> + <ngram occurrences="37" value="p" /> + <ngram occurrences="36" value="o" /> + <ngram occurrences="36" value="_¹" /> + <ngram occurrences="36" value="_µ" /> + <ngram occurrences="35" value="º_" /> + <ngram occurrences="35" value="o_" /> + <ngram occurrences="35" value="a_" /> + <ngram occurrences="35" value="a" /> + <ngram occurrences="35" value="_²" /> + <ngram occurrences="34" value="p_" /> + <ngram occurrences="34" value="c" /> + <ngram occurrences="34" value="_¨_" /> + <ngram occurrences="34" value="_à" /> + <ngram occurrences="34" value="_q" /> + <ngram occurrences="32" value="û" /> + <ngram occurrences="32" value="c_" /> + <ngram occurrences="31" value="_q_" /> + <ngram occurrences="31" value="_c_" /> + <ngram occurrences="31" value="_c" /> + <ngram occurrences="30" value="û_" /> + <ngram occurrences="30" value="á" /> + <ngram occurrences="30" value="_ÿ" /> + <ngram occurrences="29" value="ü_" /> + <ngram occurrences="29" value="ü" /> + <ngram occurrences="29" value="u" /> + <ngram occurrences="29" value="d" /> + <ngram occurrences="28" value="ªº" /> + <ngram occurrences="27" value="ø" /> + <ngram occurrences="27" value="w_" /> + <ngram occurrences="27" value="w" /> + <ngram occurrences="27" value="u_" /> + <ngram occurrences="26" value="ø_" /> + <ngram occurrences="26" value="h_" /> + <ngram occurrences="26" value="h" /> + <ngram occurrences="26" value="d_" /> + <ngram occurrences="25" value="ï" /> + <ngram occurrences="25" value="ä_" /> + <ngram occurrences="25" value="â" /> + <ngram occurrences="25" value="µ_" /> + <ngram occurrences="25" value="³_" /> + <ngram occurrences="25" value="b" /> + <ngram occurrences="25" value="_ó" /> + <ngram occurrences="25" value="_o" /> + <ngram occurrences="25" value="_d" /> + <ngram occurrences="24" value="ªº_" /> + <ngram occurrences="24" value="_ó_" /> + <ngram occurrences="24" value="_ªº_" /> + <ngram occurrences="24" value="_ªº" /> + <ngram occurrences="24" value="_o_" /> + <ngram occurrences="24" value="_d_" /> + <ngram occurrences="23" value="ç_" /> + <ngram occurrences="23" value="ç" /> + <ngram occurrences="23" value="æ" /> + <ngram occurrences="23" value="á_" /> + <ngram occurrences="23" value="b_" /> + <ngram occurrences="23" value="_á" /> + <ngram occurrences="23" value="_º" /> + <ngram occurrences="22" value="ï_" /> + <ngram occurrences="22" value="æ_" /> + <ngram occurrences="22" value="à_" /> + <ngram occurrences="22" value="ª_" /> + <ngram occurrences="22" value="g" /> + <ngram occurrences="22" value="_ä" /> + <ngram occurrences="21" value="ô_" /> + <ngram occurrences="21" value="ô" /> + <ngram occurrences="21" value="ò_" /> + <ngram occurrences="21" value="ò" /> + <ngram occurrences="21" value="ê" /> + <ngram occurrences="21" value="ã" /> + <ngram occurrences="21" value="_u" /> + <ngram occurrences="21" value="_h_" /> + <ngram occurrences="21" value="_h" /> + <ngram occurrences="20" value="½_" /> + <ngram occurrences="20" value="õ_" /> + <ngram occurrences="20" value="õ" /> + <ngram occurrences="20" value="ê_" /> + <ngram occurrences="20" value="é" /> + <ngram occurrences="20" value="t" /> + <ngram occurrences="20" value="f_" /> + <ngram occurrences="20" value="f" /> + <ngram occurrences="20" value="e" /> + <ngram occurrences="20" value="_â" /> + <ngram occurrences="20" value="_e" /> + <ngram occurrences="20" value="_a_" /> + <ngram occurrences="20" value="_a" /> + <ngram occurrences="19" value="l" /> + <ngram occurrences="19" value="g_" /> + <ngram occurrences="19" value="_é" /> + <ngram occurrences="19" value="_à_" /> + <ngram occurrences="19" value="_u_" /> + <ngram occurrences="18" value="é_" /> + <ngram occurrences="18" value="è_" /> + <ngram occurrences="18" value="è" /> + <ngram occurrences="18" value="å" /> + <ngram occurrences="18" value="â_" /> + <ngram occurrences="18" value="²_" /> + <ngram occurrences="18" value="x_" /> + <ngram occurrences="18" value="x" /> + <ngram occurrences="18" value="l_" /> + <ngram occurrences="18" value="_û" /> + <ngram occurrences="18" value="_g" /> + <ngram occurrences="17" value="¸_" /> + <ngram occurrences="17" value="t_" /> + <ngram occurrences="17" value="n" /> + <ngram occurrences="17" value="j_" /> + <ngram occurrences="17" value="j" /> + <ngram occurrences="17" value="e_" /> + <ngram occurrences="17" value="_û_" /> + <ngram occurrences="17" value="_é_" /> + <ngram occurrences="17" value="_µ_" /> + <ngram occurrences="17" value="_²_" /> + <ngram occurrences="17" value="_e_" /> + <ngram occurrences="16" value="¸ä" /> + <ngram occurrences="16" value="ð_" /> + <ngram occurrences="16" value="ð" /> + <ngram occurrences="16" value="ì_" /> + <ngram occurrences="16" value="ì" /> + <ngram occurrences="16" value="n_" /> + <ngram occurrences="16" value="_½_" /> + <ngram occurrences="16" value="_á_" /> + <ngram occurrences="16" value="_ª_" /> + <ngram occurrences="16" value="_t" /> + <ngram occurrences="15" value="ÿ_" /> + <ngram occurrences="15" value="ú" /> + <ngram occurrences="15" value="ö_" /> + <ngram occurrences="15" value="ö" /> + <ngram occurrences="15" value="î_" /> + <ngram occurrences="15" value="î" /> + <ngram occurrences="15" value="s_" /> + <ngram occurrences="15" value="s" /> + <ngram occurrences="15" value="_¸ä" /> + <ngram occurrences="15" value="_ã" /> + <ngram occurrences="15" value="_j_" /> + <ngram occurrences="15" value="_j" /> + <ngram occurrences="15" value="_g_" /> + <ngram occurrences="14" value="¸ä_" /> + <ngram occurrences="14" value="ú_" /> + <ngram occurrences="14" value="¹q" /> + <ngram occurrences="14" value="i_" /> + <ngram occurrences="14" value="i" /> + <ngram occurrences="14" value="_¸ä_" /> + <ngram occurrences="14" value="_ï" /> + <ngram occurrences="14" value="_è_" /> + <ngram occurrences="14" value="_è" /> + <ngram occurrences="14" value="_å" /> + <ngram occurrences="14" value="_w_" /> + <ngram occurrences="14" value="_w" /> + <ngram occurrences="14" value="_f_" /> + <ngram occurrences="14" value="_f" /> + <ngram occurrences="13" value="¨ó" /> + <ngram occurrences="13" value="ñ_" /> + <ngram occurrences="13" value="ñ" /> + <ngram occurrences="13" value="í_" /> + <ngram occurrences="13" value="í" /> + <ngram occurrences="13" value="¹q_" /> + <ngram occurrences="13" value="v_" /> + <ngram occurrences="13" value="v" /> + <ngram occurrences="13" value="k" /> + <ngram occurrences="13" value="_õ_" /> + <ngram occurrences="13" value="_õ" /> + <ngram occurrences="13" value="_ð_" /> + <ngram occurrences="13" value="_ð" /> + <ngram occurrences="13" value="_î_" /> + <ngram occurrences="13" value="_î" /> + <ngram occurrences="13" value="_â_" /> + <ngram occurrences="13" value="_t_" /> + <ngram occurrences="13" value="_p" /> + <ngram occurrences="13" value="_i_" /> + <ngram occurrences="13" value="_i" /> + <ngram occurrences="12" value="¨b_" /> + <ngram occurrences="12" value="¨b" /> + <ngram occurrences="12" value="ÿç_" /> + <ngram occurrences="12" value="ÿç" /> + <ngram occurrences="12" value="ë" /> + <ngram occurrences="12" value="k_" /> + <ngram occurrences="12" value="_¨b_" /> + <ngram occurrences="12" value="_¨b" /> + <ngram occurrences="12" value="_ÿç_" /> + <ngram occurrences="12" value="_ÿç" /> + <ngram occurrences="12" value="_¹q" /> + <ngram occurrences="12" value="_p_" /> + <ngram occurrences="11" value="¨ó_" /> + <ngram occurrences="11" value="¨p" /> + <ngram occurrences="11" value="ë_" /> + <ngram occurrences="11" value="m_¨" /> + <ngram occurrences="11" value="_¸_" /> + <ngram occurrences="11" value="_ï_" /> + <ngram occurrences="11" value="_ç_" /> + <ngram occurrences="11" value="_ç" /> + <ngram occurrences="11" value="_¹q_" /> + <ngram occurrences="11" value="_x_" /> + <ngram occurrences="11" value="_x" /> + <ngram occurrences="11" value="_m_¨" /> + <ngram occurrences="11" value="_l_" /> + <ngram occurrences="11" value="_l" /> + <ngram occurrences="11" value="__" /> + <ngram occurrences="10" value="¨æ_" /> + <ngram occurrences="10" value="¨æ" /> + <ngram occurrences="10" value="_¨æ_" /> + <ngram occurrences="10" value="_¨æ" /> + <ngram occurrences="10" value="_¨p" /> + <ngram occurrences="10" value="_ÿ_" /> + <ngram occurrences="10" value="_ü_" /> + <ngram occurrences="10" value="_ü" /> + <ngram occurrences="10" value="_ö_" /> + <ngram occurrences="10" value="_ö" /> + <ngram occurrences="10" value="_ô_" /> + <ngram occurrences="10" value="_ô" /> + <ngram occurrences="10" value="_º_" /> + <ngram occurrences="10" value="_s_" /> + <ngram occurrences="10" value="_s" /> + <ngram occurrences="9" value="¸ü_" /> + <ngram occurrences="9" value="¸ü" /> + <ngram occurrences="9" value="¨p_" /> + <ngram occurrences="9" value="ù" /> + <ngram occurrences="9" value="³q_" /> + <ngram occurrences="9" value="³q" /> + <ngram occurrences="9" value="q_¸" /> + <ngram occurrences="9" value="_¸ü_" /> + <ngram occurrences="9" value="_¸ü" /> + <ngram occurrences="9" value="_¨p_" /> + <ngram occurrences="9" value="_ø_" /> + <ngram occurrences="9" value="_ø" /> + <ngram occurrences="9" value="_³q_" /> + <ngram occurrences="9" value="_³q" /> + <ngram occurrences="9" value="_³_" /> + <ngram occurrences="9" value="_k" /> + <ngram occurrences="8" value="¸û_" /> + <ngram occurrences="8" value="¸û" /> + <ngram occurrences="8" value="¨ü_" /> + <ngram occurrences="8" value="¨ü" /> + <ngram occurrences="8" value="¨³_" /> + <ngram occurrences="8" value="¨³" /> + <ngram occurrences="8" value="¨a_" /> + <ngram occurrences="8" value="¨a" /> + <ngram occurrences="8" value="¨_¨" /> + <ngram occurrences="8" value="ù_" /> + <ngram occurrences="8" value="å_" /> + <ngram occurrences="8" value="¹_" /> + <ngram occurrences="8" value="ªø_" /> + <ngram occurrences="8" value="ªø" /> + <ngram occurrences="8" value="q_¨" /> + <ngram occurrences="8" value="m_¸" /> + <ngram occurrences="8" value="_¸û_" /> + <ngram occurrences="8" value="_¸û" /> + <ngram occurrences="8" value="_¨ü_" /> + <ngram occurrences="8" value="_¨ü" /> + <ngram occurrences="8" value="_¨³_" /> + <ngram occurrences="8" value="_¨³" /> + <ngram occurrences="8" value="_¨a_" /> + <ngram occurrences="8" value="_¨a" /> + <ngram occurrences="8" value="_ù" /> + <ngram occurrences="8" value="_ò_" /> + <ngram occurrences="8" value="_ò" /> + <ngram occurrences="8" value="_ñ_" /> + <ngram occurrences="8" value="_ñ" /> + <ngram occurrences="8" value="_ë" /> + <ngram occurrences="8" value="_æ_" /> + <ngram occurrences="8" value="_æ" /> + <ngram occurrences="8" value="_ªø_" /> + <ngram occurrences="8" value="_ªø" /> + <ngram occurrences="8" value="_q_¨" /> + <ngram occurrences="8" value="_n_" /> + <ngram occurrences="8" value="_n" /> + <ngram occurrences="8" value="_m_¸" /> + <ngram occurrences="8" value="_k_" /> + <ngram occurrences="8" value="_b_" /> + <ngram occurrences="8" value="_b" /> + <ngram occurrences="7" value="¸p_" /> + <ngram occurrences="7" value="¸p" /> + <ngram occurrences="7" value="¨ì_" /> + <ngram occurrences="7" value="¨ì" /> + <ngram occurrences="7" value="¨w_" /> + <ngram occurrences="7" value="¨w" /> + <ngram occurrences="7" value="ã_" /> + <ngram occurrences="7" value="¹q_¸ü" /> + <ngram occurrences="7" value="¹q_¸" /> + <ngram occurrences="7" value="³_¨" /> + <ngram occurrences="7" value="q_¸ü_" /> + <ngram occurrences="7" value="q_¸ü" /> + <ngram occurrences="7" value="o_¨" /> + <ngram occurrences="7" value="_¸p_" /> + <ngram occurrences="7" value="_¸p" /> + <ngram occurrences="7" value="_¨ó_" /> + <ngram occurrences="7" value="_¨ó" /> + <ngram occurrences="7" value="_¨ì_" /> + <ngram occurrences="7" value="_¨ì" /> + <ngram occurrences="7" value="_¨w_" /> + <ngram occurrences="7" value="_¨w" /> + <ngram occurrences="7" value="_ù_" /> + <ngram occurrences="7" value="_ë_" /> + <ngram occurrences="7" value="_ê" /> + <ngram occurrences="7" value="_¹q_¸" /> + <ngram occurrences="7" value="_v_" /> + <ngram occurrences="7" value="_v" /> + <ngram occurrences="6" value="¸ó_" /> + <ngram occurrences="6" value="¸ó" /> + <ngram occurrences="6" value="¸ê_" /> + <ngram occurrences="6" value="¸ê" /> + <ngram occurrences="6" value="¨ê_" /> + <ngram occurrences="6" value="¨ê" /> + <ngram occurrences="6" value="¨_g" /> + <ngram occurrences="6" value="ý_" /> + <ngram occurrences="6" value="ý" /> + <ngram occurrences="6" value="äµ_" /> + <ngram occurrences="6" value="äµ" /> + <ngram occurrences="6" value="º_¨" /> + <ngram occurrences="6" value="µo_" /> + <ngram occurrences="6" value="µo" /> + <ngram occurrences="6" value="²ä_" /> + <ngram occurrences="6" value="²ä" /> + <ngram occurrences="6" value="d_c_" /> + <ngram occurrences="6" value="d_c" /> + <ngram occurrences="6" value="_¸ó_" /> + <ngram occurrences="6" value="_¸ó" /> + <ngram occurrences="6" value="_¸ê_" /> + <ngram occurrences="6" value="_¸ê" /> + <ngram occurrences="6" value="_¨ê_" /> + <ngram occurrences="6" value="_¨ê" /> + <ngram occurrences="6" value="_¨_¨" /> + <ngram occurrences="6" value="_ú_" /> + <ngram occurrences="6" value="_ú" /> + <ngram occurrences="6" value="_í_" /> + <ngram occurrences="6" value="_í" /> + <ngram occurrences="6" value="_ê_" /> + <ngram occurrences="6" value="_å_" /> + <ngram occurrences="6" value="_äµ_" /> + <ngram occurrences="6" value="_äµ" /> + <ngram occurrences="6" value="_µo_" /> + <ngram occurrences="6" value="_µo" /> + <ngram occurrences="6" value="_²ä_" /> + <ngram occurrences="6" value="_²ä" /> + <ngram occurrences="6" value="_o_¨" /> + <ngram occurrences="6" value="_d_c_" /> + <ngram occurrences="6" value="_d_c" /> + <ngram occurrences="5" value="¨â_" /> + <ngram occurrences="5" value="¨â" /> + <ngram occurrences="5" value="½u_" /> + <ngram occurrences="5" value="½u" /> + <ngram occurrences="5" value="½_¨" /> + <ngram occurrences="5" value="ä_q_" /> + <ngram occurrences="5" value="ä_q" /> + <ngram occurrences="5" value="á_¨" /> + <ngram occurrences="5" value="²ä_q_" /> + <ngram occurrences="5" value="²ä_q" /> + <ngram occurrences="5" value="z" /> + <ngram occurrences="5" value="y" /> + <ngram occurrences="5" value="t_¨" /> + <ngram occurrences="5" value="p_ª" /> + <ngram occurrences="5" value="i_¨" /> + <ngram occurrences="5" value="f_¨" /> + <ngram occurrences="5" value="_½u_" /> + <ngram occurrences="5" value="_½u" /> + <ngram occurrences="5" value="_²ä_q" /> + <ngram occurrences="5" value="_i_¨" /> + <ngram occurrences="5" value="___" /> + <ngram occurrences="4" value="¸ô_" /> + <ngram occurrences="4" value="¸ô" /> + <ngram occurrences="4" value="¸ë_" /> + <ngram occurrences="4" value="¸ë" /> + <ngram occurrences="4" value="¸_x_" /> + <ngram occurrences="4" value="¸_x" /> + <ngram occurrences="4" value="¨¸_" /> + <ngram occurrences="4" value="¨¸" /> + <ngram occurrences="4" value="¨ï_" /> + <ngram occurrences="4" value="¨ï" /> + <ngram occurrences="4" value="¨n_" /> + <ngram occurrences="4" value="¨n" /> + <ngram occurrences="4" value="¨_ª" /> + <ngram occurrences="4" value="½õ_d_" /> + <ngram occurrences="4" value="½õ_d" /> + <ngram occurrences="4" value="½õ_" /> + <ngram occurrences="4" value="½õ" /> +</ngrams> diff --git a/src/plugins/language/chinese1.klp b/src/plugins/language/chinese1.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1172" value="_" /> + <ngram occurrences="143" value="½" /> + <ngram occurrences="141" value="µ" /> + <ngram occurrences="112" value="¹" /> + <ngram occurrences="106" value="ö" /> + <ngram occurrences="105" value="_µ" /> + <ngram occurrences="103" value="ä" /> + <ngram occurrences="94" value="ê" /> + <ngram occurrences="91" value="¸" /> + <ngram occurrences="90" value="ú" /> + <ngram occurrences="89" value="ë" /> + <ngram occurrences="81" value="ð" /> + <ngram occurrences="78" value="õ" /> + <ngram occurrences="77" value="_½" /> + <ngram occurrences="76" value="á" /> + <ngram occurrences="75" value="ò" /> + <ngram occurrences="74" value="î" /> + <ngram occurrences="71" value="_¹" /> + <ngram occurrences="70" value="è" /> + <ngram occurrences="70" value="ä_" /> + <ngram occurrences="69" value="ó" /> + <ngram occurrences="69" value="é" /> + <ngram occurrences="68" value="í" /> + <ngram occurrences="67" value="ï" /> + <ngram occurrences="67" value="à" /> + <ngram occurrences="64" value="ú_" /> + <ngram occurrences="63" value="²" /> + <ngram occurrences="62" value="ô" /> + <ngram occurrences="57" value="ö_" /> + <ngram occurrences="57" value="_¸" /> + <ngram occurrences="56" value="ã" /> + <ngram occurrences="54" value="ë_" /> + <ngram occurrences="53" value="_ö" /> + <ngram occurrences="52" value="ÿ" /> + <ngram occurrences="52" value="ç" /> + <ngram occurrences="52" value="â" /> + <ngram occurrences="52" value="µä_" /> + <ngram occurrences="52" value="µä" /> + <ngram occurrences="52" value="_µä_" /> + <ngram occurrences="52" value="_µä" /> + <ngram occurrences="51" value="ñ" /> + <ngram occurrences="51" value="_á" /> + <ngram occurrences="50" value="½_" /> + <ngram occurrences="49" value="ø" /> + <ngram occurrences="49" value="¹_" /> + <ngram occurrences="49" value="³" /> + <ngram occurrences="45" value="ì" /> + <ngram occurrences="44" value="_î" /> + <ngram occurrences="43" value="_è" /> + <ngram occurrences="40" value="µ_" /> + <ngram occurrences="40" value="_ê" /> + <ngram occurrences="40" value="_²" /> + <ngram occurrences="39" value="_ô" /> + <ngram occurrences="38" value="¸_" /> + <ngram occurrences="38" value="ê_" /> + <ngram occurrences="38" value="_õ" /> + <ngram occurrences="37" value="å" /> + <ngram occurrences="37" value="º" /> + <ngram occurrences="35" value="ð_" /> + <ngram occurrences="35" value="í_" /> + <ngram occurrences="35" value="_ó" /> + <ngram occurrences="34" value="æ" /> + <ngram occurrences="34" value="²_" /> + <ngram occurrences="34" value="_ò" /> + <ngram occurrences="34" value="_é" /> + <ngram occurrences="33" value="î_" /> + <ngram occurrences="33" value="ª" /> + <ngram occurrences="33" value="_ÿ" /> + <ngram occurrences="33" value="_à" /> + <ngram occurrences="32" value="¨" /> + <ngram occurrences="32" value="_¹_" /> + <ngram occurrences="31" value="ï_" /> + <ngram occurrences="31" value="ç_" /> + <ngram occurrences="31" value="_ë" /> + <ngram occurrences="30" value="ù" /> + <ngram occurrences="28" value="ü" /> + <ngram occurrences="28" value="ø_" /> + <ngram occurrences="28" value="ñ_" /> + <ngram occurrences="27" value="â_" /> + <ngram occurrences="27" value="¹ú" /> + <ngram occurrences="27" value="_í" /> + <ngram occurrences="26" value="è_" /> + <ngram occurrences="26" value="ª_" /> + <ngram occurrences="25" value="ý" /> + <ngram occurrences="25" value="û" /> + <ngram occurrences="25" value="ó_" /> + <ngram occurrences="25" value="ò_" /> + <ngram occurrences="25" value="é_" /> + <ngram occurrences="25" value="à_" /> + <ngram occurrences="25" value="_ï" /> + <ngram occurrences="24" value="_ö_" /> + <ngram occurrences="24" value="_ä" /> + <ngram occurrences="24" value="_²_" /> + <ngram occurrences="23" value="õ_" /> + <ngram occurrences="23" value="å_" /> + <ngram occurrences="23" value="áë_" /> + <ngram occurrences="23" value="áë" /> + <ngram occurrences="23" value="_º" /> + <ngram occurrences="22" value="ù_" /> + <ngram occurrences="22" value="_ð" /> + <ngram occurrences="22" value="_ì" /> + <ngram occurrences="22" value="_µ_" /> + <ngram occurrences="21" value="ô_" /> + <ngram occurrences="21" value="_¸_" /> + <ngram occurrences="21" value="_ã" /> + <ngram occurrences="21" value="_áë_" /> + <ngram occurrences="21" value="_áë" /> + <ngram occurrences="20" value="þ" /> + <ngram occurrences="20" value="ôú" /> + <ngram occurrences="20" value="äê" /> + <ngram occurrences="20" value="ã_" /> + <ngram occurrences="20" value="³_" /> + <ngram occurrences="20" value="_æ" /> + <ngram occurrences="20" value="_³" /> + <ngram occurrences="19" value="ôú_" /> + <ngram occurrences="19" value="¹ú_" /> + <ngram occurrences="18" value="¨_" /> + <ngram occurrences="18" value="ý_" /> + <ngram occurrences="17" value="_ôú" /> + <ngram occurrences="17" value="_ê_" /> + <ngram occurrences="16" value="ÿ_" /> + <ngram occurrences="16" value="ðð" /> + <ngram occurrences="16" value="ì_" /> + <ngram occurrences="16" value="_ôú_" /> + <ngram occurrences="16" value="_ñ" /> + <ngram occurrences="16" value="_å" /> + <ngram occurrences="15" value="û_" /> + <ngram occurrences="15" value="_à_" /> + <ngram occurrences="14" value="ü_" /> + <ngram occurrences="14" value="èë" /> + <ngram occurrences="14" value="_½_" /> + <ngram occurrences="14" value="_äê" /> + <ngram occurrences="13" value="æ_" /> + <ngram occurrences="13" value="äê_" /> + <ngram occurrences="13" value="á_" /> + <ngram occurrences="13" value="_ç" /> + <ngram occurrences="12" value="³ö_" /> + <ngram occurrences="12" value="³ö" /> + <ngram occurrences="12" value="_î_" /> + <ngram occurrences="12" value="_è_" /> + <ngram occurrences="11" value="¸ó" /> + <ngram occurrences="11" value="öð" /> + <ngram occurrences="11" value="ðð_" /> + <ngram occurrences="11" value="ºí" /> + <ngram occurrences="11" value="µ½_" /> + <ngram occurrences="11" value="µ½" /> + <ngram occurrences="11" value="_¨" /> + <ngram occurrences="11" value="_ó_" /> + <ngram occurrences="11" value="_å_" /> + <ngram occurrences="11" value="_¹ú" /> + <ngram occurrences="10" value="õþ" /> + <ngram occurrences="10" value="éï" /> + <ngram occurrences="10" value="ãñ" /> + <ngram occurrences="10" value="ºí_" /> + <ngram occurrences="10" value="º_" /> + <ngram occurrences="10" value="_ù_" /> + <ngram occurrences="10" value="_ù" /> + <ngram occurrences="10" value="_öð" /> + <ngram occurrences="10" value="_ë_" /> + <ngram occurrences="10" value="_äê_" /> + <ngram occurrences="10" value="_ºí_" /> + <ngram occurrences="10" value="_ºí" /> + <ngram occurrences="10" value="_ª" /> + <ngram occurrences="9" value="½¨" /> + <ngram occurrences="9" value="½ø" /> + <ngram occurrences="9" value="õâ" /> + <ngram occurrences="9" value="ãç_" /> + <ngram occurrences="9" value="ãç" /> + <ngram occurrences="9" value="ß" /> + <ngram occurrences="9" value="_¸ó" /> + <ngram occurrences="9" value="_ú" /> + <ngram occurrences="9" value="_ô_" /> + <ngram occurrences="9" value="_éï" /> + <ngram occurrences="9" value="_â" /> + <ngram occurrences="9" value="_ª_" /> + <ngram occurrences="8" value="¸ö" /> + <ngram occurrences="8" value="ÿü" /> + <ngram occurrences="8" value="ÿù" /> + <ngram occurrences="8" value="àí" /> + <ngram occurrences="8" value="ß_" /> + <ngram occurrences="8" value="µø" /> + <ngram occurrences="8" value="µã" /> + <ngram occurrences="8" value="²ú" /> + <ngram occurrences="8" value="_½¨" /> + <ngram occurrences="8" value="_ÿù" /> + <ngram occurrences="8" value="_ÿ_" /> + <ngram occurrences="8" value="_õþ" /> + <ngram occurrences="8" value="_õâ" /> + <ngram occurrences="8" value="_ï_" /> + <ngram occurrences="7" value="¸ö_" /> + <ngram occurrences="7" value="½_¹" /> + <ngram occurrences="7" value="½_µ" /> + <ngram occurrences="7" value="ÿö" /> + <ngram occurrences="7" value="þ_" /> + <ngram occurrences="7" value="øð" /> + <ngram occurrences="7" value="òµ" /> + <ngram occurrences="7" value="îä" /> + <ngram occurrences="7" value="êõ" /> + <ngram occurrences="7" value="éï_" /> + <ngram occurrences="7" value="èõ" /> + <ngram occurrences="7" value="èë_" /> + <ngram occurrences="7" value="ãñ_" /> + <ngram occurrences="7" value="à¸_" /> + <ngram occurrences="7" value="à¸" /> + <ngram occurrences="7" value="¹ø" /> + <ngram occurrences="7" value="¹_µ" /> + <ngram occurrences="7" value="_¨_" /> + <ngram occurrences="7" value="_½ø" /> + <ngram occurrences="7" value="_ò_" /> + <ngram occurrences="7" value="_ñ_" /> + <ngram occurrences="7" value="_îä" /> + <ngram occurrences="7" value="_ì_" /> + <ngram occurrences="7" value="_èõ" /> + <ngram occurrences="7" value="_èë" /> + <ngram occurrences="7" value="_µã" /> + <ngram occurrences="7" value="_³ö_" /> + <ngram occurrences="7" value="_³ö" /> + <ngram occurrences="7" value="_³_" /> + <ngram occurrences="6" value="¸ó_" /> + <ngram occurrences="6" value="½½" /> + <ngram occurrences="6" value="½ü" /> + <ngram occurrences="6" value="ú½" /> + <ngram occurrences="6" value="ú_¸" /> + <ngram occurrences="6" value="ö_ö" /> + <ngram occurrences="6" value="ö_¹" /> + <ngram occurrences="6" value="ö_µ" /> + <ngram occurrences="6" value="õâ_" /> + <ngram occurrences="6" value="õ¹" /> + <ngram occurrences="6" value="òé_" /> + <ngram occurrences="6" value="òé" /> + <ngram occurrences="6" value="òµ_" /> + <ngram occurrences="6" value="ð_µ" /> + <ngram occurrences="6" value="îò" /> + <ngram occurrences="6" value="îê" /> + <ngram occurrences="6" value="íò_" /> + <ngram occurrences="6" value="íò" /> + <ngram occurrences="6" value="ëû" /> + <ngram occurrences="6" value="ë_½" /> + <ngram occurrences="6" value="ê_µ" /> + <ngram occurrences="6" value="èõ_" /> + <ngram occurrences="6" value="ä_½" /> + <ngram occurrences="6" value="àí_" /> + <ngram occurrences="6" value="¹²" /> + <ngram occurrences="6" value="µø_" /> + <ngram occurrences="6" value="µ_¸" /> + <ngram occurrences="6" value="_¸ö" /> + <ngram occurrences="6" value="_ú_" /> + <ngram occurrences="6" value="_îò" /> + <ngram occurrences="6" value="_íò_" /> + <ngram occurrences="6" value="_íò" /> + <ngram occurrences="6" value="_í_" /> + <ngram occurrences="6" value="_ëû" /> + <ngram occurrences="6" value="_éï_" /> + <ngram occurrences="6" value="_èõ_" /> + <ngram occurrences="6" value="_¹²" /> + <ngram occurrences="6" value="_µ½_" /> + <ngram occurrences="6" value="_µ½" /> + <ngram occurrences="6" value="_µø" /> + <ngram occurrences="5" value="½¸_" /> + <ngram occurrences="5" value="½¸" /> + <ngram occurrences="5" value="½ê" /> + <ngram occurrences="5" value="ÿö_" /> + <ngram occurrences="5" value="ú_µ" /> + <ngram occurrences="5" value="øðð" /> + <ngram occurrences="5" value="öî_" /> + <ngram occurrences="5" value="öî" /> + <ngram occurrences="5" value="ö_ö_" /> + <ngram occurrences="5" value="ô½_" /> + <ngram occurrences="5" value="ô½" /> + <ngram occurrences="5" value="óú" /> + <ngram occurrences="5" value="óð_" /> + <ngram occurrences="5" value="óð" /> + <ngram occurrences="5" value="óã" /> + <ngram occurrences="5" value="ðô" /> + <ngram occurrences="5" value="ðâ" /> + <ngram occurrences="5" value="ð_á" /> + <ngram occurrences="5" value="ïµ" /> + <ngram occurrences="5" value="ï_½" /> + <ngram occurrences="5" value="ìâ_" /> + <ngram occurrences="5" value="ìâ" /> + <ngram occurrences="5" value="ìá" /> + <ngram occurrences="5" value="ì_µ" /> + <ngram occurrences="5" value="ë_õ" /> + <ngram occurrences="5" value="êç" /> + <ngram occurrences="5" value="êâ" /> + <ngram occurrences="5" value="êà" /> + <ngram occurrences="5" value="êµ" /> + <ngram occurrences="5" value="éú" /> + <ngram occurrences="5" value="çø_" /> + <ngram occurrences="5" value="çø" /> + <ngram occurrences="5" value="ä_ö" /> + <ngram occurrences="5" value="ä_é" /> + <ngram occurrences="5" value="ä_¹" /> + <ngram occurrences="5" value="á¨_" /> + <ngram occurrences="5" value="á¨" /> + <ngram occurrences="5" value="áª" /> + <ngram occurrences="5" value="ºï" /> + <ngram occurrences="5" value="¹ý" /> + <ngram occurrences="5" value="¹_¸" /> + <ngram occurrences="5" value="µä_¹" /> + <ngram occurrences="5" value="µã_" /> + <ngram occurrences="5" value="³é" /> + <ngram occurrences="5" value="_¸ö_" /> + <ngram occurrences="5" value="_½¸_" /> + <ngram occurrences="5" value="_½¸" /> + <ngram occurrences="5" value="_½½" /> + <ngram occurrences="5" value="_ÿü" /> + <ngram occurrences="5" value="_ö_ö" /> + <ngram occurrences="5" value="_ö_¹" /> + <ngram occurrences="5" value="_õâ_" /> + <ngram occurrences="5" value="_ðâ" /> + <ngram occurrences="5" value="_ð_" /> + <ngram occurrences="5" value="_îê" /> + <ngram occurrences="5" value="_ìá" /> + <ngram occurrences="5" value="_ãñ" /> + <ngram occurrences="5" value="_ã_" /> + <ngram occurrences="5" value="_á_" /> + <ngram occurrences="5" value="_¹ý" /> + <ngram occurrences="5" value="_¹ø" /> + <ngram occurrences="5" value="_¹_¸" /> + <ngram occurrences="5" value="_µø_" /> + <ngram occurrences="5" value="_µä_¹" /> + <ngram occurrences="5" value="_²ú" /> + <ngram occurrences="4" value="¸ï" /> + <ngram occurrences="4" value="¸_ö" /> + <ngram occurrences="4" value="¸_í" /> + <ngram occurrences="4" value="¸_¹" /> + <ngram occurrences="4" value="¸_µ" /> + <ngram occurrences="4" value="½û" /> + <ngram occurrences="4" value="½øðð_" /> + <ngram occurrences="4" value="½øðð" /> + <ngram occurrences="4" value="½øð" /> + <ngram occurrences="4" value="½ò" /> + <ngram occurrences="4" value="½ì" /> + <ngram occurrences="4" value="½ç" /> + <ngram occurrences="4" value="½æ" /> + <ngram occurrences="4" value="½ä" /> + <ngram occurrences="4" value="½â" /> + <ngram occurrences="4" value="½_õ" /> + <ngram occurrences="4" value="½_µä_" /> + <ngram occurrences="4" value="½_µä" /> + <ngram occurrences="4" value="ÿí_" /> + <ngram occurrences="4" value="ÿí" /> + <ngram occurrences="4" value="ÿ_½" /> + <ngram occurrences="4" value="þöî_" /> + <ngram occurrences="4" value="þöî" /> + <ngram occurrences="4" value="þö" /> + <ngram occurrences="4" value="þ²" /> + <ngram occurrences="4" value="û_ë" /> + <ngram occurrences="4" value="ú¹" /> + <ngram occurrences="4" value="ú_õ" /> + <ngram occurrences="4" value="ú_î" /> + <ngram occurrences="4" value="ú_í" /> + <ngram occurrences="4" value="ú_²" /> + <ngram occurrences="4" value="ù_ö_ö" /> + <ngram occurrences="4" value="ù_ö_" /> + <ngram occurrences="4" value="ù_ö" /> + <ngram occurrences="4" value="øðð_" /> + <ngram occurrences="4" value="ø_ÿ" /> + <ngram occurrences="4" value="öø" /> + <ngram occurrences="4" value="öðð" /> + <ngram occurrences="4" value="öð_" /> + <ngram occurrences="4" value="ö_ò" /> + <ngram occurrences="4" value="ö_á" /> + <ngram occurrences="4" value="ö_¹_" /> + <ngram occurrences="4" value="õ½" /> + <ngram occurrences="4" value="õþöî_" /> + <ngram occurrences="4" value="õþöî" /> + <ngram occurrences="4" value="õþö" /> + <ngram occurrences="4" value="õ¹_" /> + <ngram occurrences="4" value="ôª_" /> + <ngram occurrences="4" value="ôª" /> + <ngram occurrences="4" value="óú_" /> + <ngram occurrences="4" value="óª" /> + <ngram occurrences="4" value="ó_¹" /> + <ngram occurrences="4" value="òñ_" /> + <ngram occurrences="4" value="òñ" /> + <ngram occurrences="4" value="òª_" /> + <ngram occurrences="4" value="òª" /> + <ngram occurrences="4" value="ñ_µä_" /> + <ngram occurrences="4" value="ñ_µä" /> + <ngram occurrences="4" value="ñ_µ" /> + <ngram occurrences="4" value="ð_áë_" /> + <ngram occurrences="4" value="ð_áë" /> + <ngram occurrences="4" value="ïø_" /> + <ngram occurrences="4" value="ïø" /> + <ngram occurrences="4" value="îêìâ_" /> + <ngram occurrences="4" value="îêìâ" /> + <ngram occurrences="4" value="îêì" /> + <ngram occurrences="4" value="îä_" /> + <ngram occurrences="4" value="îª_" /> + <ngram occurrences="4" value="îª" /> + <ngram occurrences="4" value="í_½" /> + <ngram occurrences="4" value="ìõ" /> + <ngram occurrences="4" value="ëû_" /> + <ngram occurrences="4" value="ëã" /> + <ngram occurrences="4" value="ëµ_" /> + <ngram occurrences="4" value="ëµ" /> + <ngram occurrences="4" value="ë_ê" /> + <ngram occurrences="4" value="ë_é" /> +</ngrams> diff --git a/src/plugins/language/chinese2.klp b/src/plugins/language/chinese2.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1172" value="_" /> + <ngram occurrences="143" value="½" /> + <ngram occurrences="141" value="µ" /> + <ngram occurrences="112" value="¹" /> + <ngram occurrences="106" value="ö" /> + <ngram occurrences="105" value="_µ" /> + <ngram occurrences="103" value="ä" /> + <ngram occurrences="94" value="ê" /> + <ngram occurrences="91" value="¸" /> + <ngram occurrences="90" value="ú" /> + <ngram occurrences="89" value="ë" /> + <ngram occurrences="81" value="ð" /> + <ngram occurrences="78" value="õ" /> + <ngram occurrences="77" value="_½" /> + <ngram occurrences="76" value="á" /> + <ngram occurrences="75" value="ò" /> + <ngram occurrences="74" value="î" /> + <ngram occurrences="71" value="_¹" /> + <ngram occurrences="70" value="è" /> + <ngram occurrences="70" value="ä_" /> + <ngram occurrences="69" value="ó" /> + <ngram occurrences="69" value="é" /> + <ngram occurrences="68" value="í" /> + <ngram occurrences="67" value="ï" /> + <ngram occurrences="67" value="à" /> + <ngram occurrences="64" value="ú_" /> + <ngram occurrences="63" value="²" /> + <ngram occurrences="62" value="ô" /> + <ngram occurrences="57" value="ö_" /> + <ngram occurrences="57" value="_¸" /> + <ngram occurrences="56" value="ã" /> + <ngram occurrences="54" value="ë_" /> + <ngram occurrences="53" value="_ö" /> + <ngram occurrences="52" value="ÿ" /> + <ngram occurrences="52" value="ç" /> + <ngram occurrences="52" value="â" /> + <ngram occurrences="52" value="µä_" /> + <ngram occurrences="52" value="µä" /> + <ngram occurrences="52" value="_µä_" /> + <ngram occurrences="52" value="_µä" /> + <ngram occurrences="51" value="ñ" /> + <ngram occurrences="51" value="_á" /> + <ngram occurrences="50" value="½_" /> + <ngram occurrences="49" value="ø" /> + <ngram occurrences="49" value="¹_" /> + <ngram occurrences="49" value="³" /> + <ngram occurrences="45" value="ì" /> + <ngram occurrences="44" value="_î" /> + <ngram occurrences="43" value="_è" /> + <ngram occurrences="40" value="µ_" /> + <ngram occurrences="40" value="_ê" /> + <ngram occurrences="40" value="_²" /> + <ngram occurrences="39" value="_ô" /> + <ngram occurrences="38" value="¸_" /> + <ngram occurrences="38" value="ê_" /> + <ngram occurrences="38" value="_õ" /> + <ngram occurrences="37" value="å" /> + <ngram occurrences="37" value="º" /> + <ngram occurrences="35" value="ð_" /> + <ngram occurrences="35" value="í_" /> + <ngram occurrences="35" value="_ó" /> + <ngram occurrences="34" value="æ" /> + <ngram occurrences="34" value="²_" /> + <ngram occurrences="34" value="_ò" /> + <ngram occurrences="34" value="_é" /> + <ngram occurrences="33" value="î_" /> + <ngram occurrences="33" value="ª" /> + <ngram occurrences="33" value="_ÿ" /> + <ngram occurrences="33" value="_à" /> + <ngram occurrences="32" value="¨" /> + <ngram occurrences="32" value="_¹_" /> + <ngram occurrences="31" value="ï_" /> + <ngram occurrences="31" value="ç_" /> + <ngram occurrences="31" value="_ë" /> + <ngram occurrences="30" value="ù" /> + <ngram occurrences="28" value="ü" /> + <ngram occurrences="28" value="ø_" /> + <ngram occurrences="28" value="ñ_" /> + <ngram occurrences="27" value="â_" /> + <ngram occurrences="27" value="¹ú" /> + <ngram occurrences="27" value="_í" /> + <ngram occurrences="26" value="è_" /> + <ngram occurrences="26" value="ª_" /> + <ngram occurrences="25" value="ý" /> + <ngram occurrences="25" value="û" /> + <ngram occurrences="25" value="ó_" /> + <ngram occurrences="25" value="ò_" /> + <ngram occurrences="25" value="é_" /> + <ngram occurrences="25" value="à_" /> + <ngram occurrences="25" value="_ï" /> + <ngram occurrences="24" value="_ö_" /> + <ngram occurrences="24" value="_ä" /> + <ngram occurrences="24" value="_²_" /> + <ngram occurrences="23" value="õ_" /> + <ngram occurrences="23" value="å_" /> + <ngram occurrences="23" value="áë_" /> + <ngram occurrences="23" value="áë" /> + <ngram occurrences="23" value="_º" /> + <ngram occurrences="22" value="ù_" /> + <ngram occurrences="22" value="_ð" /> + <ngram occurrences="22" value="_ì" /> + <ngram occurrences="22" value="_µ_" /> + <ngram occurrences="21" value="ô_" /> + <ngram occurrences="21" value="_¸_" /> + <ngram occurrences="21" value="_ã" /> + <ngram occurrences="21" value="_áë_" /> + <ngram occurrences="21" value="_áë" /> + <ngram occurrences="20" value="þ" /> + <ngram occurrences="20" value="ôú" /> + <ngram occurrences="20" value="äê" /> + <ngram occurrences="20" value="ã_" /> + <ngram occurrences="20" value="³_" /> + <ngram occurrences="20" value="_æ" /> + <ngram occurrences="20" value="_³" /> + <ngram occurrences="19" value="ôú_" /> + <ngram occurrences="19" value="¹ú_" /> + <ngram occurrences="18" value="¨_" /> + <ngram occurrences="18" value="ý_" /> + <ngram occurrences="17" value="_ôú" /> + <ngram occurrences="17" value="_ê_" /> + <ngram occurrences="16" value="ÿ_" /> + <ngram occurrences="16" value="ðð" /> + <ngram occurrences="16" value="ì_" /> + <ngram occurrences="16" value="_ôú_" /> + <ngram occurrences="16" value="_ñ" /> + <ngram occurrences="16" value="_å" /> + <ngram occurrences="15" value="û_" /> + <ngram occurrences="15" value="_à_" /> + <ngram occurrences="14" value="ü_" /> + <ngram occurrences="14" value="èë" /> + <ngram occurrences="14" value="_½_" /> + <ngram occurrences="14" value="_äê" /> + <ngram occurrences="13" value="æ_" /> + <ngram occurrences="13" value="äê_" /> + <ngram occurrences="13" value="á_" /> + <ngram occurrences="13" value="_ç" /> + <ngram occurrences="12" value="³ö_" /> + <ngram occurrences="12" value="³ö" /> + <ngram occurrences="12" value="_î_" /> + <ngram occurrences="12" value="_è_" /> + <ngram occurrences="11" value="¸ó" /> + <ngram occurrences="11" value="öð" /> + <ngram occurrences="11" value="ðð_" /> + <ngram occurrences="11" value="ºí" /> + <ngram occurrences="11" value="µ½_" /> + <ngram occurrences="11" value="µ½" /> + <ngram occurrences="11" value="_¨" /> + <ngram occurrences="11" value="_ó_" /> + <ngram occurrences="11" value="_å_" /> + <ngram occurrences="11" value="_¹ú" /> + <ngram occurrences="10" value="õþ" /> + <ngram occurrences="10" value="éï" /> + <ngram occurrences="10" value="ãñ" /> + <ngram occurrences="10" value="ºí_" /> + <ngram occurrences="10" value="º_" /> + <ngram occurrences="10" value="_ù_" /> + <ngram occurrences="10" value="_ù" /> + <ngram occurrences="10" value="_öð" /> + <ngram occurrences="10" value="_ë_" /> + <ngram occurrences="10" value="_äê_" /> + <ngram occurrences="10" value="_ºí_" /> + <ngram occurrences="10" value="_ºí" /> + <ngram occurrences="10" value="_ª" /> + <ngram occurrences="9" value="½¨" /> + <ngram occurrences="9" value="½ø" /> + <ngram occurrences="9" value="õâ" /> + <ngram occurrences="9" value="ãç_" /> + <ngram occurrences="9" value="ãç" /> + <ngram occurrences="9" value="ß" /> + <ngram occurrences="9" value="_¸ó" /> + <ngram occurrences="9" value="_ú" /> + <ngram occurrences="9" value="_ô_" /> + <ngram occurrences="9" value="_éï" /> + <ngram occurrences="9" value="_â" /> + <ngram occurrences="9" value="_ª_" /> + <ngram occurrences="8" value="¸ö" /> + <ngram occurrences="8" value="ÿü" /> + <ngram occurrences="8" value="ÿù" /> + <ngram occurrences="8" value="àí" /> + <ngram occurrences="8" value="ß_" /> + <ngram occurrences="8" value="µø" /> + <ngram occurrences="8" value="µã" /> + <ngram occurrences="8" value="²ú" /> + <ngram occurrences="8" value="_½¨" /> + <ngram occurrences="8" value="_ÿù" /> + <ngram occurrences="8" value="_ÿ_" /> + <ngram occurrences="8" value="_õþ" /> + <ngram occurrences="8" value="_õâ" /> + <ngram occurrences="8" value="_ï_" /> + <ngram occurrences="7" value="¸ö_" /> + <ngram occurrences="7" value="½_¹" /> + <ngram occurrences="7" value="½_µ" /> + <ngram occurrences="7" value="ÿö" /> + <ngram occurrences="7" value="þ_" /> + <ngram occurrences="7" value="øð" /> + <ngram occurrences="7" value="òµ" /> + <ngram occurrences="7" value="îä" /> + <ngram occurrences="7" value="êõ" /> + <ngram occurrences="7" value="éï_" /> + <ngram occurrences="7" value="èõ" /> + <ngram occurrences="7" value="èë_" /> + <ngram occurrences="7" value="ãñ_" /> + <ngram occurrences="7" value="à¸_" /> + <ngram occurrences="7" value="à¸" /> + <ngram occurrences="7" value="¹ø" /> + <ngram occurrences="7" value="¹_µ" /> + <ngram occurrences="7" value="_¨_" /> + <ngram occurrences="7" value="_½ø" /> + <ngram occurrences="7" value="_ò_" /> + <ngram occurrences="7" value="_ñ_" /> + <ngram occurrences="7" value="_îä" /> + <ngram occurrences="7" value="_ì_" /> + <ngram occurrences="7" value="_èõ" /> + <ngram occurrences="7" value="_èë" /> + <ngram occurrences="7" value="_µã" /> + <ngram occurrences="7" value="_³ö_" /> + <ngram occurrences="7" value="_³ö" /> + <ngram occurrences="7" value="_³_" /> + <ngram occurrences="6" value="¸ó_" /> + <ngram occurrences="6" value="½½" /> + <ngram occurrences="6" value="½ü" /> + <ngram occurrences="6" value="ú½" /> + <ngram occurrences="6" value="ú_¸" /> + <ngram occurrences="6" value="ö_ö" /> + <ngram occurrences="6" value="ö_¹" /> + <ngram occurrences="6" value="ö_µ" /> + <ngram occurrences="6" value="õâ_" /> + <ngram occurrences="6" value="õ¹" /> + <ngram occurrences="6" value="òé_" /> + <ngram occurrences="6" value="òé" /> + <ngram occurrences="6" value="òµ_" /> + <ngram occurrences="6" value="ð_µ" /> + <ngram occurrences="6" value="îò" /> + <ngram occurrences="6" value="îê" /> + <ngram occurrences="6" value="íò_" /> + <ngram occurrences="6" value="íò" /> + <ngram occurrences="6" value="ëû" /> + <ngram occurrences="6" value="ë_½" /> + <ngram occurrences="6" value="ê_µ" /> + <ngram occurrences="6" value="èõ_" /> + <ngram occurrences="6" value="ä_½" /> + <ngram occurrences="6" value="àí_" /> + <ngram occurrences="6" value="¹²" /> + <ngram occurrences="6" value="µø_" /> + <ngram occurrences="6" value="µ_¸" /> + <ngram occurrences="6" value="_¸ö" /> + <ngram occurrences="6" value="_ú_" /> + <ngram occurrences="6" value="_îò" /> + <ngram occurrences="6" value="_íò_" /> + <ngram occurrences="6" value="_íò" /> + <ngram occurrences="6" value="_í_" /> + <ngram occurrences="6" value="_ëû" /> + <ngram occurrences="6" value="_éï_" /> + <ngram occurrences="6" value="_èõ_" /> + <ngram occurrences="6" value="_¹²" /> + <ngram occurrences="6" value="_µ½_" /> + <ngram occurrences="6" value="_µ½" /> + <ngram occurrences="6" value="_µø" /> + <ngram occurrences="5" value="½¸_" /> + <ngram occurrences="5" value="½¸" /> + <ngram occurrences="5" value="½ê" /> + <ngram occurrences="5" value="ÿö_" /> + <ngram occurrences="5" value="ú_µ" /> + <ngram occurrences="5" value="øðð" /> + <ngram occurrences="5" value="öî_" /> + <ngram occurrences="5" value="öî" /> + <ngram occurrences="5" value="ö_ö_" /> + <ngram occurrences="5" value="ô½_" /> + <ngram occurrences="5" value="ô½" /> + <ngram occurrences="5" value="óú" /> + <ngram occurrences="5" value="óð_" /> + <ngram occurrences="5" value="óð" /> + <ngram occurrences="5" value="óã" /> + <ngram occurrences="5" value="ðô" /> + <ngram occurrences="5" value="ðâ" /> + <ngram occurrences="5" value="ð_á" /> + <ngram occurrences="5" value="ïµ" /> + <ngram occurrences="5" value="ï_½" /> + <ngram occurrences="5" value="ìâ_" /> + <ngram occurrences="5" value="ìâ" /> + <ngram occurrences="5" value="ìá" /> + <ngram occurrences="5" value="ì_µ" /> + <ngram occurrences="5" value="ë_õ" /> + <ngram occurrences="5" value="êç" /> + <ngram occurrences="5" value="êâ" /> + <ngram occurrences="5" value="êà" /> + <ngram occurrences="5" value="êµ" /> + <ngram occurrences="5" value="éú" /> + <ngram occurrences="5" value="çø_" /> + <ngram occurrences="5" value="çø" /> + <ngram occurrences="5" value="ä_ö" /> + <ngram occurrences="5" value="ä_é" /> + <ngram occurrences="5" value="ä_¹" /> + <ngram occurrences="5" value="á¨_" /> + <ngram occurrences="5" value="á¨" /> + <ngram occurrences="5" value="áª" /> + <ngram occurrences="5" value="ºï" /> + <ngram occurrences="5" value="¹ý" /> + <ngram occurrences="5" value="¹_¸" /> + <ngram occurrences="5" value="µä_¹" /> + <ngram occurrences="5" value="µã_" /> + <ngram occurrences="5" value="³é" /> + <ngram occurrences="5" value="_¸ö_" /> + <ngram occurrences="5" value="_½¸_" /> + <ngram occurrences="5" value="_½¸" /> + <ngram occurrences="5" value="_½½" /> + <ngram occurrences="5" value="_ÿü" /> + <ngram occurrences="5" value="_ö_ö" /> + <ngram occurrences="5" value="_ö_¹" /> + <ngram occurrences="5" value="_õâ_" /> + <ngram occurrences="5" value="_ðâ" /> + <ngram occurrences="5" value="_ð_" /> + <ngram occurrences="5" value="_îê" /> + <ngram occurrences="5" value="_ìá" /> + <ngram occurrences="5" value="_ãñ" /> + <ngram occurrences="5" value="_ã_" /> + <ngram occurrences="5" value="_á_" /> + <ngram occurrences="5" value="_¹ý" /> + <ngram occurrences="5" value="_¹ø" /> + <ngram occurrences="5" value="_¹_¸" /> + <ngram occurrences="5" value="_µø_" /> + <ngram occurrences="5" value="_µä_¹" /> + <ngram occurrences="5" value="_²ú" /> + <ngram occurrences="4" value="¸ï" /> + <ngram occurrences="4" value="¸_ö" /> + <ngram occurrences="4" value="¸_í" /> + <ngram occurrences="4" value="¸_¹" /> + <ngram occurrences="4" value="¸_µ" /> + <ngram occurrences="4" value="½û" /> + <ngram occurrences="4" value="½øðð_" /> + <ngram occurrences="4" value="½øðð" /> + <ngram occurrences="4" value="½øð" /> + <ngram occurrences="4" value="½ò" /> + <ngram occurrences="4" value="½ì" /> + <ngram occurrences="4" value="½ç" /> + <ngram occurrences="4" value="½æ" /> + <ngram occurrences="4" value="½ä" /> + <ngram occurrences="4" value="½â" /> + <ngram occurrences="4" value="½_õ" /> + <ngram occurrences="4" value="½_µä_" /> + <ngram occurrences="4" value="½_µä" /> + <ngram occurrences="4" value="ÿí_" /> + <ngram occurrences="4" value="ÿí" /> + <ngram occurrences="4" value="ÿ_½" /> + <ngram occurrences="4" value="þöî_" /> + <ngram occurrences="4" value="þöî" /> + <ngram occurrences="4" value="þö" /> + <ngram occurrences="4" value="þ²" /> + <ngram occurrences="4" value="û_ë" /> + <ngram occurrences="4" value="ú¹" /> + <ngram occurrences="4" value="ú_õ" /> + <ngram occurrences="4" value="ú_î" /> + <ngram occurrences="4" value="ú_í" /> + <ngram occurrences="4" value="ú_²" /> + <ngram occurrences="4" value="ù_ö_ö" /> + <ngram occurrences="4" value="ù_ö_" /> + <ngram occurrences="4" value="ù_ö" /> + <ngram occurrences="4" value="øðð_" /> + <ngram occurrences="4" value="ø_ÿ" /> + <ngram occurrences="4" value="öø" /> + <ngram occurrences="4" value="öðð" /> + <ngram occurrences="4" value="öð_" /> + <ngram occurrences="4" value="ö_ò" /> + <ngram occurrences="4" value="ö_á" /> + <ngram occurrences="4" value="ö_¹_" /> + <ngram occurrences="4" value="õ½" /> + <ngram occurrences="4" value="õþöî_" /> + <ngram occurrences="4" value="õþöî" /> + <ngram occurrences="4" value="õþö" /> + <ngram occurrences="4" value="õ¹_" /> + <ngram occurrences="4" value="ôª_" /> + <ngram occurrences="4" value="ôª" /> + <ngram occurrences="4" value="óú_" /> + <ngram occurrences="4" value="óª" /> + <ngram occurrences="4" value="ó_¹" /> + <ngram occurrences="4" value="òñ_" /> + <ngram occurrences="4" value="òñ" /> + <ngram occurrences="4" value="òª_" /> + <ngram occurrences="4" value="òª" /> + <ngram occurrences="4" value="ñ_µä_" /> + <ngram occurrences="4" value="ñ_µä" /> + <ngram occurrences="4" value="ñ_µ" /> + <ngram occurrences="4" value="ð_áë_" /> + <ngram occurrences="4" value="ð_áë" /> + <ngram occurrences="4" value="ïø_" /> + <ngram occurrences="4" value="ïø" /> + <ngram occurrences="4" value="îêìâ_" /> + <ngram occurrences="4" value="îêìâ" /> + <ngram occurrences="4" value="îêì" /> + <ngram occurrences="4" value="îä_" /> + <ngram occurrences="4" value="îª_" /> + <ngram occurrences="4" value="îª" /> + <ngram occurrences="4" value="í_½" /> + <ngram occurrences="4" value="ìõ" /> + <ngram occurrences="4" value="ëû_" /> + <ngram occurrences="4" value="ëã" /> + <ngram occurrences="4" value="ëµ_" /> + <ngram occurrences="4" value="ëµ" /> + <ngram occurrences="4" value="ë_ê" /> + <ngram occurrences="4" value="ë_é" /> +</ngrams> diff --git a/src/plugins/language/croatian.klp b/src/plugins/language/croatian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="782" value="_" /> + <ngram occurrences="425" value="o" /> + <ngram occurrences="417" value="a" /> + <ngram occurrences="363" value="e" /> + <ngram occurrences="335" value="i" /> + <ngram occurrences="258" value="n" /> + <ngram occurrences="230" value="s" /> + <ngram occurrences="229" value="j" /> + <ngram occurrences="186" value="t" /> + <ngram occurrences="174" value="u" /> + <ngram occurrences="161" value="r" /> + <ngram occurrences="156" value="l" /> + <ngram occurrences="155" value="e_" /> + <ngram occurrences="152" value="je" /> + <ngram occurrences="151" value="k" /> + <ngram occurrences="150" value="a_" /> + <ngram occurrences="149" value="o_" /> + <ngram occurrences="140" value="d" /> + <ngram occurrences="137" value="m" /> + <ngram occurrences="132" value="v" /> + <ngram occurrences="105" value="p" /> + <ngram occurrences="99" value="_s" /> + <ngram occurrences="91" value="y" /> + <ngram occurrences="91" value="i_" /> + <ngram occurrences="85" value="z" /> + <ngram occurrences="83" value="je_" /> + <ngram occurrences="79" value="u_" /> + <ngram occurrences="74" value="_n" /> + <ngram occurrences="73" value="g" /> + <ngram occurrences="67" value="c" /> + <ngram occurrences="66" value="_p" /> + <ngram occurrences="64" value="b" /> + <ngram occurrences="61" value="_d" /> + <ngram occurrences="60" value="_j" /> + <ngram occurrences="59" value="st" /> + <ngram occurrences="57" value="_je" /> + <ngram occurrences="53" value="ne" /> + <ngram occurrences="53" value="_je_" /> + <ngram occurrences="51" value="ko" /> + <ngram occurrences="47" value="da" /> + <ngram occurrences="47" value="_o" /> + <ngram occurrences="46" value="no" /> + <ngram occurrences="46" value="_i" /> + <ngram occurrences="44" value="_k" /> + <ngram occurrences="41" value="to" /> + <ngram occurrences="39" value="ni" /> + <ngram occurrences="39" value="ja" /> + <ngram occurrences="39" value="ij" /> + <ngram occurrences="37" value="na" /> + <ngram occurrences="36" value="ta" /> + <ngram occurrences="36" value="ka" /> + <ngram occurrences="36" value="an" /> + <ngram occurrences="35" value="ra" /> + <ngram occurrences="35" value="lo" /> + <ngram occurrences="35" value="ak" /> + <ngram occurrences="35" value="_u" /> + <ngram occurrences="34" value="sy" /> + <ngram occurrences="34" value="_m" /> + <ngram occurrences="33" value="m_" /> + <ngram occurrences="32" value="ti" /> + <ngram occurrences="32" value="ije" /> + <ngram occurrences="32" value="da_" /> + <ngram occurrences="32" value="_ne" /> + <ngram occurrences="31" value="li" /> + <ngram occurrences="30" value="pr" /> + <ngram occurrences="30" value="is" /> + <ngram occurrences="30" value="en" /> + <ngram occurrences="29" value="vo" /> + <ngram occurrences="29" value="po" /> + <ngram occurrences="29" value="ov" /> + <ngram occurrences="29" value="in" /> + <ngram occurrences="29" value="cy" /> + <ngram occurrences="29" value="_z" /> + <ngram occurrences="29" value="_t" /> + <ngram occurrences="29" value="_da" /> + <ngram occurrences="29" value="_b" /> + <ngram occurrences="28" value="os" /> + <ngram occurrences="28" value="al" /> + <ngram occurrences="28" value="_g" /> + <ngram occurrences="27" value="zy" /> + <ngram occurrences="27" value="im" /> + <ngram occurrences="27" value="_pr" /> + <ngram occurrences="26" value="vi" /> + <ngram occurrences="26" value="va" /> + <ngram occurrences="26" value="om" /> + <ngram occurrences="26" value="bi" /> + <ngram occurrences="25" value="ri" /> + <ngram occurrences="25" value="on" /> + <ngram occurrences="25" value="lj" /> + <ngram occurrences="25" value="la" /> + <ngram occurrences="25" value="ek" /> + <ngram occurrences="25" value="ao" /> + <ngram occurrences="24" value="ma" /> + <ngram occurrences="24" value="ko_" /> + <ngram occurrences="24" value="es" /> + <ngram occurrences="23" value="ya" /> + <ngram occurrences="23" value="re" /> + <ngram occurrences="23" value="og" /> + <ngram occurrences="23" value="ne_" /> + <ngram occurrences="23" value="ao_" /> + <ngram occurrences="23" value="a_s" /> + <ngram occurrences="23" value="_da_" /> + <ngram occurrences="23" value="_c" /> + <ngram occurrences="22" value="oj" /> + <ngram occurrences="22" value="no_" /> + <ngram occurrences="22" value="na_" /> + <ngram occurrences="22" value="at" /> + <ngram occurrences="22" value="_i_" /> + <ngram occurrences="21" value="se" /> + <ngram occurrences="21" value="or" /> + <ngram occurrences="21" value="le" /> + <ngram occurrences="21" value="il" /> + <ngram occurrences="21" value="go" /> + <ngram occurrences="21" value="av" /> + <ngram occurrences="20" value="za" /> + <ngram occurrences="20" value="sa" /> + <ngram occurrences="20" value="ol" /> + <ngram occurrences="20" value="lo_" /> + <ngram occurrences="20" value="k_" /> + <ngram occurrences="20" value="et" /> + <ngram occurrences="20" value="_po" /> + <ngram occurrences="20" value="_ka" /> + <ngram occurrences="19" value="ve" /> + <ngram occurrences="19" value="sto" /> + <ngram occurrences="19" value="o_s" /> + <ngram occurrences="19" value="o_je_" /> + <ngram occurrences="19" value="o_je" /> + <ngram occurrences="19" value="o_j" /> + <ngram occurrences="19" value="nu" /> + <ngram occurrences="19" value="ad" /> + <ngram occurrences="19" value="_v" /> + <ngram occurrences="19" value="_u_" /> + <ngram occurrences="18" value="te" /> + <ngram occurrences="18" value="ru" /> + <ngram occurrences="18" value="ro" /> + <ngram occurrences="18" value="iz" /> + <ngram occurrences="18" value="e_p" /> + <ngram occurrences="18" value="_se" /> + <ngram occurrences="18" value="_bi" /> + <ngram occurrences="17" value="ti_" /> + <ngram occurrences="17" value="se_" /> + <ngram occurrences="17" value="od" /> + <ngram occurrences="17" value="nj" /> + <ngram occurrences="17" value="h" /> + <ngram occurrences="17" value="g_" /> + <ngram occurrences="17" value="e_n" /> + <ngram occurrences="17" value="ar" /> + <ngram occurrences="17" value="_st" /> + <ngram occurrences="17" value="_cy" /> + <ngram occurrences="16" value="to_" /> + <ngram occurrences="16" value="ok" /> + <ngram occurrences="16" value="mi" /> + <ngram occurrences="16" value="ed" /> + <ngram occurrences="16" value="do" /> + <ngram occurrences="16" value="am" /> + <ngram occurrences="16" value="_se_" /> + <ngram occurrences="16" value="_na" /> + <ngram occurrences="16" value="_ko" /> + <ngram occurrences="16" value="_a" /> + <ngram occurrences="15" value="yi" /> + <ngram occurrences="15" value="om_" /> + <ngram occurrences="15" value="ob" /> + <ngram occurrences="15" value="ns" /> + <ngram occurrences="15" value="n_" /> + <ngram occurrences="15" value="mo" /> + <ngram occurrences="15" value="lje" /> + <ngram occurrences="15" value="kak" /> + <ngram occurrences="15" value="ije_" /> + <ngram occurrences="15" value="el" /> + <ngram occurrences="15" value="e_s" /> + <ngram occurrences="15" value="ako" /> + <ngram occurrences="15" value="_ni" /> + <ngram occurrences="15" value="_l" /> + <ngram occurrences="14" value="su" /> + <ngram occurrences="14" value="sta" /> + <ngram occurrences="14" value="og_" /> + <ngram occurrences="14" value="o_n" /> + <ngram occurrences="14" value="kr" /> + <ngram occurrences="14" value="ja_" /> + <ngram occurrences="14" value="ic" /> + <ngram occurrences="14" value="di" /> + <ngram occurrences="14" value="cj" /> + <ngram occurrences="14" value="bil" /> + <ngram occurrences="14" value="_za" /> + <ngram occurrences="13" value="u_p" /> + <ngram occurrences="13" value="sv" /> + <ngram occurrences="13" value="o_d" /> + <ngram occurrences="13" value="ma_" /> + <ngram occurrences="13" value="je_n" /> + <ngram occurrences="13" value="ins" /> + <ngram occurrences="13" value="im_" /> + <ngram occurrences="13" value="em" /> + <ngram occurrences="13" value="a_j" /> + <ngram occurrences="12" value="uz" /> + <ngram occurrences="12" value="su_" /> + <ngram occurrences="12" value="sl" /> + <ngram occurrences="12" value="pa" /> + <ngram occurrences="12" value="nst" /> + <ngram occurrences="12" value="me" /> + <ngram occurrences="12" value="koj" /> + <ngram occurrences="12" value="it" /> + <ngram occurrences="12" value="io" /> + <ngram occurrences="12" value="gl" /> + <ngram occurrences="12" value="ako_" /> + <ngram occurrences="12" value="aj" /> + <ngram occurrences="12" value="a_n" /> + <ngram occurrences="12" value="a_je" /> + <ngram occurrences="12" value="_sv" /> + <ngram occurrences="12" value="_su" /> + <ngram occurrences="12" value="_r" /> + <ngram occurrences="12" value="_na_" /> + <ngram occurrences="12" value="_bil" /> + <ngram occurrences="11" value="yt" /> + <ngram occurrences="11" value="tr" /> + <ngram occurrences="11" value="syt" /> + <ngram occurrences="11" value="sk" /> + <ngram occurrences="11" value="ran" /> + <ngram occurrences="11" value="o_p" /> + <ngram occurrences="11" value="o_k" /> + <ngram occurrences="11" value="mu" /> + <ngram occurrences="11" value="li_" /> + <ngram occurrences="11" value="ju" /> + <ngram occurrences="11" value="inst" /> + <ngram occurrences="11" value="ima" /> + <ngram occurrences="11" value="ga" /> + <ngram occurrences="11" value="ev" /> + <ngram occurrences="11" value="e_o" /> + <ngram occurrences="11" value="a_k" /> + <ngram occurrences="11" value="a_je_" /> + <ngram occurrences="11" value="_sa" /> + <ngram occurrences="11" value="_koj" /> + <ngram occurrences="11" value="_do" /> + <ngram occurrences="10" value="za_" /> + <ngram occurrences="10" value="winst" /> + <ngram occurrences="10" value="wins" /> + <ngram occurrences="10" value="win" /> + <ngram occurrences="10" value="wi" /> + <ngram occurrences="10" value="w" /> + <ngram occurrences="10" value="ton" /> + <ngram occurrences="10" value="tn" /> + <ngram occurrences="10" value="ston" /> + <ngram occurrences="10" value="pri" /> + <ngram occurrences="10" value="on_" /> + <ngram occurrences="10" value="nston" /> + <ngram occurrences="10" value="nsto" /> + <ngram occurrences="10" value="ni_" /> + <ngram occurrences="10" value="la_" /> + <ngram occurrences="10" value="jes" /> + <ngram occurrences="10" value="je_p" /> + <ngram occurrences="10" value="j_" /> + <ngram occurrences="10" value="io_" /> + <ngram occurrences="10" value="insto" /> + <ngram occurrences="10" value="ilo" /> + <ngram occurrences="10" value="i_s" /> + <ngram occurrences="10" value="i_n" /> + <ngram occurrences="10" value="i_i" /> + <ngram occurrences="10" value="h_" /> + <ngram occurrences="10" value="e_po" /> + <ngram occurrences="10" value="e_ne" /> + <ngram occurrences="10" value="e_d" /> + <ngram occurrences="10" value="dr" /> + <ngram occurrences="10" value="dj" /> + <ngram occurrences="10" value="d_" /> + <ngram occurrences="10" value="as" /> + <ngram occurrences="10" value="a_d" /> + <ngram occurrences="10" value="_wins" /> + <ngram occurrences="10" value="_win" /> + <ngram occurrences="10" value="_wi" /> + <ngram occurrences="10" value="_w" /> + <ngram occurrences="10" value="_su_" /> + <ngram occurrences="10" value="_pri" /> + <ngram occurrences="10" value="_os" /> + <ngram occurrences="10" value="_iz" /> + <ngram occurrences="10" value="_go" /> + <ngram occurrences="9" value="ye" /> + <ngram occurrences="9" value="vo_" /> + <ngram occurrences="9" value="vje" /> + <ngram occurrences="9" value="vj" /> + <ngram occurrences="9" value="vij" /> + <ngram occurrences="9" value="ur" /> + <ngram occurrences="9" value="tv" /> + <ngram occurrences="9" value="tu" /> + <ngram occurrences="9" value="ton_" /> + <ngram occurrences="9" value="ta_" /> + <ngram occurrences="9" value="ston_" /> + <ngram occurrences="9" value="sti" /> + <ngram occurrences="9" value="so" /> + <ngram occurrences="9" value="rn" /> + <ngram occurrences="9" value="r_" /> + <ngram occurrences="9" value="pre" /> + <ngram occurrences="9" value="pi" /> + <ngram occurrences="9" value="ost" /> + <ngram occurrences="9" value="o_m" /> + <ngram occurrences="9" value="nu_" /> + <ngram occurrences="9" value="nt" /> + <ngram occurrences="9" value="nje" /> + <ngram occurrences="9" value="mje" /> + <ngram occurrences="9" value="mj" /> + <ngram occurrences="9" value="lu" /> + <ngram occurrences="9" value="ku" /> + <ngram occurrences="9" value="kako_" /> + <ngram occurrences="9" value="kako" /> + <ngram occurrences="9" value="ji" /> + <ngram occurrences="9" value="jen" /> + <ngram occurrences="9" value="ilo_" /> + <ngram occurrences="9" value="i_d" /> + <ngram occurrences="9" value="est" /> + <ngram occurrences="9" value="er" /> + <ngram occurrences="9" value="ec" /> + <ngram occurrences="9" value="e_t" /> + <ngram occurrences="9" value="cya" /> + <ngram occurrences="9" value="ci" /> + <ngram occurrences="9" value="ce" /> + <ngram occurrences="9" value="a_i" /> + <ngram occurrences="9" value="_zy" /> + <ngram occurrences="9" value="_te" /> + <ngram occurrences="9" value="_mu" /> + <ngram occurrences="9" value="_mo" /> + <ngram occurrences="8" value="zm" /> + <ngram occurrences="8" value="yto_" /> + <ngram occurrences="8" value="yto" /> + <ngram occurrences="8" value="va_" /> + <ngram occurrences="8" value="ut" /> + <ngram occurrences="8" value="u_s" /> + <ngram occurrences="8" value="u_je" /> + <ngram occurrences="8" value="u_j" /> + <ngram occurrences="8" value="syto_" /> + <ngram occurrences="8" value="syto" /> + <ngram occurrences="8" value="sp" /> + <ngram occurrences="8" value="si" /> + <ngram occurrences="8" value="s_" /> + <ngram occurrences="8" value="rij" /> + <ngram occurrences="8" value="nov" /> + <ngram occurrences="8" value="nij" /> + <ngram occurrences="8" value="mu_" /> + <ngram occurrences="8" value="lic" /> + <ngram occurrences="8" value="ju_" /> + <ngram occurrences="8" value="jek_" /> + <ngram occurrences="8" value="jek" /> + <ngram occurrences="8" value="je_ne" /> + <ngram occurrences="8" value="ih_" /> + <ngram occurrences="8" value="ih" /> + <ngram occurrences="8" value="ez" /> + <ngram occurrences="8" value="esy" /> + <ngram occurrences="8" value="ek_" /> + <ngram occurrences="8" value="eg" /> + <ngram occurrences="8" value="ecj" /> + <ngram occurrences="8" value="e_u" /> + <ngram occurrences="8" value="e_m" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="bilo_" /> + <ngram occurrences="8" value="bilo" /> + <ngram occurrences="8" value="ali" /> + <ngram occurrences="8" value="ak_" /> + <ngram occurrences="8" value="a_o" /> + <ngram occurrences="8" value="a_g" /> + <ngram occurrences="8" value="_to" /> + <ngram occurrences="8" value="_pre" /> + <ngram occurrences="8" value="_kak" /> + <ngram occurrences="8" value="_je_n" /> + <ngram occurrences="8" value="_bilo" /> + <ngram occurrences="7" value="zyi" /> + <ngram occurrences="7" value="zya" /> + <ngram occurrences="7" value="yn" /> + <ngram occurrences="7" value="y_" /> + <ngram occurrences="7" value="vor" /> + <ngram occurrences="7" value="vije" /> + <ngram occurrences="7" value="ve_" /> + <ngram occurrences="7" value="uzy" /> + <ngram occurrences="7" value="up" /> + <ngram occurrences="7" value="ug" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="uc" /> + <ngram occurrences="7" value="u_pr" /> + <ngram occurrences="7" value="u_k" /> + <ngram occurrences="7" value="u_je_" /> + <ngram occurrences="7" value="u_c" /> + <ngram occurrences="7" value="t_" /> + <ngram occurrences="7" value="sya" /> + <ngram occurrences="7" value="pro" /> + <ngram occurrences="7" value="pl" /> + <ngram occurrences="7" value="oz" /> + <ngram occurrences="7" value="ovo" /> + <ngram occurrences="7" value="ot" /> + <ngram occurrences="7" value="op" /> + <ngram occurrences="7" value="olje" /> + <ngram occurrences="7" value="olj" /> + <ngram occurrences="7" value="oc" /> + <ngram occurrences="7" value="o_u" /> + <ngram occurrences="7" value="o_ka" /> + <ngram occurrences="7" value="o_da" /> + <ngram occurrences="7" value="nim" /> + <ngram occurrences="7" value="nije_" /> + <ngram occurrences="7" value="nije" /> + <ngram occurrences="7" value="nes" /> + <ngram occurrences="7" value="nek" /> + <ngram occurrences="7" value="mis" /> + <ngram occurrences="7" value="m_d" /> + <ngram occurrences="7" value="lja" /> + <ngram occurrences="7" value="ki" /> +</ngrams> diff --git a/src/plugins/language/czech.klp b/src/plugins/language/czech.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="732" value="_" /> + <ngram occurrences="352" value="o" /> + <ngram occurrences="300" value="a" /> + <ngram occurrences="278" value="e" /> + <ngram occurrences="250" value="n" /> + <ngram occurrences="215" value="t" /> + <ngram occurrences="209" value="s" /> + <ngram occurrences="197" value="v" /> + <ngram occurrences="179" value="l" /> + <ngram occurrences="163" value="r" /> + <ngram occurrences="150" value="i" /> + <ngram occurrences="148" value="k" /> + <ngram occurrences="147" value="d" /> + <ngram occurrences="146" value="p" /> + <ngram occurrences="136" value="u" /> + <ngram occurrences="112" value="m" /> + <ngram occurrences="109" value="z" /> + <ngram occurrences="99" value="á" /> + <ngram occurrences="98" value="h" /> + <ngram occurrences="97" value="c" /> + <ngram occurrences="94" value="_p" /> + <ngram occurrences="92" value="í" /> + <ngram occurrences="87" value="a_" /> + <ngram occurrences="86" value="y" /> + <ngram occurrences="81" value="o_" /> + <ngram occurrences="79" value="_s" /> + <ngram occurrences="73" value="j" /> + <ngram occurrences="71" value="b" /> + <ngram occurrences="68" value="e_" /> + <ngram occurrences="67" value="_v" /> + <ngram occurrences="67" value="_n" /> + <ngram occurrences="65" value="ì" /> + <ngram occurrences="63" value="u_" /> + <ngram occurrences="56" value="é" /> + <ngram occurrences="52" value="ø" /> + <ngram occurrences="51" value="st" /> + <ngram occurrences="50" value="y_" /> + <ngram occurrences="50" value="_z" /> + <ngram occurrences="46" value="na" /> + <ngram occurrences="45" value="í_" /> + <ngram occurrences="45" value="è" /> + <ngram occurrences="44" value="ho" /> + <ngram occurrences="42" value="ov" /> + <ngram occurrences="41" value="pr" /> + <ngram occurrences="40" value="ra" /> + <ngram occurrences="39" value="ro" /> + <ngram occurrences="39" value="po" /> + <ngram occurrences="38" value="é_" /> + <ngram occurrences="38" value="m_" /> + <ngram occurrences="38" value="_a" /> + <ngram occurrences="36" value="ý" /> + <ngram occurrences="36" value="od" /> + <ngram occurrences="36" value="_d" /> + <ngram occurrences="35" value="ní" /> + <ngram occurrences="34" value="ÿ" /> + <ngram occurrences="34" value="sk" /> + <ngram occurrences="34" value="i_" /> + <ngram occurrences="34" value="ch" /> + <ngram occurrences="33" value="_j" /> + <ngram occurrences="32" value="ne" /> + <ngram occurrences="31" value="to" /> + <ngram occurrences="29" value="ou" /> + <ngram occurrences="29" value="lo" /> + <ngram occurrences="29" value="en" /> + <ngram occurrences="29" value="_o" /> + <ngram occurrences="29" value="_k" /> + <ngram occurrences="29" value="_b" /> + <ngram occurrences="28" value="_t" /> + <ngram occurrences="27" value="_pr" /> + <ngram occurrences="27" value="_po" /> + <ngram occurrences="26" value="¹" /> + <ngram occurrences="26" value="t_" /> + <ngram occurrences="26" value="l_" /> + <ngram occurrences="26" value="je" /> + <ngram occurrences="26" value="_na" /> + <ngram occurrences="25" value="va" /> + <ngram occurrences="25" value="te" /> + <ngram occurrences="25" value="ta" /> + <ngram occurrences="25" value="na_" /> + <ngram occurrences="24" value="øe" /> + <ngram occurrences="24" value="pø" /> + <ngram occurrences="24" value="os" /> + <ngram occurrences="24" value="le" /> + <ngram occurrences="24" value="la" /> + <ngram occurrences="24" value="at" /> + <ngram occurrences="24" value="_m" /> + <ngram occurrences="24" value="_a_" /> + <ngram occurrences="23" value="ké" /> + <ngram occurrences="23" value="ko" /> + <ngram occurrences="23" value="av" /> + <ngram occurrences="23" value="al" /> + <ngram occurrences="23" value="_ne" /> + <ngram occurrences="22" value="do" /> + <ngram occurrences="22" value="_r" /> + <ngram occurrences="22" value="_pø" /> + <ngram occurrences="21" value="ù" /> + <ngram occurrences="21" value="ì_" /> + <ngram occurrences="21" value="ho_" /> + <ngram occurrences="21" value="ed" /> + <ngram occurrences="21" value="ak" /> + <ngram occurrences="21" value="ad" /> + <ngram occurrences="20" value="za" /> + <ngram occurrences="20" value="v_" /> + <ngram occurrences="20" value="li" /> + <ngram occurrences="20" value="an" /> + <ngram occurrences="19" value="ze" /> + <ngram occurrences="19" value="vo" /> + <ngram occurrences="19" value="so" /> + <ngram occurrences="19" value="ní_" /> + <ngram occurrences="19" value="es" /> + <ngram occurrences="19" value="ce" /> + <ngram occurrences="18" value="ské" /> + <ngram occurrences="18" value="or" /> + <ngram occurrences="18" value="ob" /> + <ngram occurrences="18" value="nì" /> + <ngram occurrences="18" value="no" /> + <ngram occurrences="18" value="ej" /> + <ngram occurrences="18" value="_za" /> + <ngram occurrences="18" value="_v_" /> + <ngram occurrences="18" value="_je" /> + <ngram occurrences="17" value="to_" /> + <ngram occurrences="17" value="ti" /> + <ngram occurrences="17" value="k_" /> + <ngram occurrences="17" value="_è" /> + <ngram occurrences="17" value="_c" /> + <ngram occurrences="16" value="ÿe" /> + <ngram occurrences="16" value="ve" /> + <ngram occurrences="16" value="se" /> + <ngram occurrences="16" value="s_" /> + <ngram occurrences="16" value="pro" /> + <ngram occurrences="16" value="ka" /> + <ngram occurrences="16" value="il" /> + <ngram occurrences="16" value="_to" /> + <ngram occurrences="15" value="vy" /> + <ngram occurrences="15" value="sl" /> + <ngram occurrences="15" value="oz" /> + <ngram occurrences="15" value="ké_" /> + <ngram occurrences="15" value="it" /> + <ngram occurrences="15" value="h_" /> + <ngram occurrences="15" value="ez" /> + <ngram occurrences="15" value="dn" /> + <ngram occurrences="15" value="ch_" /> + <ngram occurrences="15" value="by" /> + <ngram occurrences="15" value="_na_" /> + <ngram occurrences="14" value="øi" /> + <ngram occurrences="14" value="ého_" /> + <ngram occurrences="14" value="ého" /> + <ngram occurrences="14" value="éh" /> + <ngram occurrences="14" value="vý" /> + <ngram occurrences="14" value="tu" /> + <ngram occurrences="14" value="ou_" /> + <ngram occurrences="14" value="ná" /> + <ngram occurrences="14" value="ni" /> + <ngram occurrences="14" value="lá" /> + <ngram occurrences="14" value="lo_" /> + <ngram occurrences="14" value="in" /> + <ngram occurrences="14" value="et" /> + <ngram occurrences="14" value="da" /> + <ngram occurrences="14" value="_se" /> + <ngram occurrences="14" value="_pro" /> + <ngram occurrences="14" value="_h" /> + <ngram occurrences="13" value="ý_" /> + <ngram occurrences="13" value="vì" /> + <ngram occurrences="13" value="tn" /> + <ngram occurrences="13" value="sv" /> + <ngram occurrences="13" value="rá" /> + <ngram occurrences="13" value="pøe" /> + <ngram occurrences="13" value="pra" /> + <ngram occurrences="13" value="mì" /> + <ngram occurrences="13" value="ic" /> + <ngram occurrences="13" value="el" /> + <ngram occurrences="13" value="as" /> + <ngram occurrences="13" value="_sv" /> + <ngram occurrences="13" value="_l" /> + <ngram occurrences="12" value="ím" /> + <ngram occurrences="12" value="èe" /> + <ngram occurrences="12" value="vé" /> + <ngram occurrences="12" value="se_" /> + <ngram occurrences="12" value="ot" /> + <ngram occurrences="12" value="ost" /> + <ngram occurrences="12" value="ol" /> + <ngram occurrences="12" value="o_s" /> + <ngram occurrences="12" value="né" /> + <ngram occurrences="12" value="la_" /> + <ngram occurrences="12" value="ku" /> + <ngram occurrences="12" value="g" /> + <ngram occurrences="12" value="er" /> + <ngram occurrences="12" value="em" /> + <ngram occurrences="12" value="bo" /> + <ngram occurrences="12" value="_so" /> + <ngram occurrences="12" value="_se_" /> + <ngram occurrences="12" value="_pøe" /> + <ngram occurrences="11" value="ÿe_" /> + <ngram occurrences="11" value="ìt" /> + <ngram occurrences="11" value="át" /> + <ngram occurrences="11" value="á_" /> + <ngram occurrences="11" value="tr" /> + <ngram occurrences="11" value="pod" /> + <ngram occurrences="11" value="om" /> + <ngram occurrences="11" value="o_p" /> + <ngram occurrences="11" value="o_n" /> + <ngram occurrences="11" value="mu" /> + <ngram occurrences="11" value="ky" /> + <ngram occurrences="11" value="je_" /> + <ngram occurrences="11" value="f" /> + <ngram occurrences="11" value="a_p" /> + <ngram occurrences="11" value="_st" /> + <ngram occurrences="11" value="_do" /> + <ngram occurrences="10" value="ÿ_" /> + <ngram occurrences="10" value="án" /> + <ngram occurrences="10" value="zá" /> + <ngram occurrences="10" value="ské_" /> + <ngram occurrences="10" value="ru" /> + <ngram occurrences="10" value="re" /> + <ngram occurrences="10" value="pøi" /> + <ngram occurrences="10" value="on" /> + <ngram occurrences="10" value="nì_" /> + <ngram occurrences="10" value="né_" /> + <ngram occurrences="10" value="nt" /> + <ngram occurrences="10" value="lu" /> + <ngram occurrences="10" value="ku_" /> + <ngram occurrences="10" value="ji" /> + <ngram occurrences="10" value="ik" /> + <ngram occurrences="10" value="a_v" /> + <ngram occurrences="10" value="a_s" /> + <ngram occurrences="10" value="_vy" /> + <ngram occurrences="10" value="_ro" /> + <ngram occurrences="10" value="_ko" /> + <ngram occurrences="10" value="_ho" /> + <ngram occurrences="10" value="_by" /> + <ngram occurrences="9" value="ù_" /> + <ngram occurrences="9" value="øed" /> + <ngram occurrences="9" value="íc" /> + <ngram occurrences="9" value="èn" /> + <ngram occurrences="9" value="ut" /> + <ngram occurrences="9" value="u_v" /> + <ngram occurrences="9" value="sta" /> + <ngram occurrences="9" value="rn" /> + <ngram occurrences="9" value="rav" /> + <ngram occurrences="9" value="o_d" /> + <ngram occurrences="9" value="nos" /> + <ngram occurrences="9" value="n_" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="mi" /> + <ngram occurrences="9" value="ký" /> + <ngram occurrences="9" value="is" /> + <ngram occurrences="9" value="hl" /> + <ngram occurrences="9" value="ep" /> + <ngram occurrences="9" value="em_" /> + <ngram occurrences="9" value="ec" /> + <ngram occurrences="9" value="e_s" /> + <ngram occurrences="9" value="e_n" /> + <ngram occurrences="9" value="dì" /> + <ngram occurrences="9" value="dy" /> + <ngram occurrences="9" value="di" /> + <ngram occurrences="9" value="de" /> + <ngram occurrences="9" value="d_" /> + <ngram occurrences="9" value="ar" /> + <ngram occurrences="9" value="ah" /> + <ngram occurrences="9" value="ac" /> + <ngram occurrences="9" value="_ÿ" /> + <ngram occurrences="9" value="_ve" /> + <ngram occurrences="9" value="_u" /> + <ngram occurrences="9" value="_to_" /> + <ngram occurrences="9" value="_pøi" /> + <ngram occurrences="8" value="ých_" /> + <ngram occurrences="8" value="ých" /> + <ngram occurrences="8" value="ýc" /> + <ngram occurrences="8" value="ím_" /> + <ngram occurrences="8" value="áv" /> + <ngram occurrences="8" value="zn" /> + <ngram occurrences="8" value="yl" /> + <ngram occurrences="8" value="vé_" /> + <ngram occurrences="8" value="vá" /> + <ngram occurrences="8" value="vi" /> + <ngram occurrences="8" value="u_p" /> + <ngram occurrences="8" value="tv" /> + <ngram occurrences="8" value="ského" /> + <ngram occurrences="8" value="skéh" /> + <ngram occurrences="8" value="prav" /> + <ngram occurrences="8" value="pa" /> + <ngram occurrences="8" value="op" /> + <ngram occurrences="8" value="ok" /> + <ngram occurrences="8" value="ny_" /> + <ngram occurrences="8" value="ny" /> + <ngram occurrences="8" value="nost" /> + <ngram occurrences="8" value="kého_" /> + <ngram occurrences="8" value="kého" /> + <ngram occurrences="8" value="kéh" /> + <ngram occurrences="8" value="ky_" /> + <ngram occurrences="8" value="jí" /> + <ngram occurrences="8" value="ja" /> + <ngram occurrences="8" value="il_" /> + <ngram occurrences="8" value="hod" /> + <ngram occurrences="8" value="du" /> + <ngram occurrences="8" value="co" /> + <ngram occurrences="8" value="ce_" /> + <ngram occurrences="8" value="bu" /> + <ngram occurrences="8" value="az" /> + <ngram occurrences="8" value="am" /> + <ngram occurrences="8" value="_ÿe_" /> + <ngram occurrences="8" value="_ÿe" /> + <ngram occurrences="8" value="_èe" /> + <ngram occurrences="7" value="ìl" /> + <ngram occurrences="7" value="áz" /> + <ngram occurrences="7" value="ás" /> + <ngram occurrences="7" value="ál" /> + <ngram occurrences="7" value="¹í" /> + <ngram occurrences="7" value="zu" /> + <ngram occurrences="7" value="zp" /> + <ngram occurrences="7" value="ze_" /> + <ngram occurrences="7" value="ví" /> + <ngram occurrences="7" value="vn" /> + <ngram occurrences="7" value="vat" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="tá" /> + <ngram occurrences="7" value="ty" /> + <ngram occurrences="7" value="tu_" /> + <ngram occurrences="7" value="spo" /> + <ngram occurrences="7" value="sp" /> + <ngram occurrences="7" value="sov" /> + <ngram occurrences="7" value="sou" /> + <ngram occurrences="7" value="roz" /> + <ngram occurrences="7" value="pøed" /> + <ngram occurrences="7" value="pol" /> + <ngram occurrences="7" value="ové" /> + <ngram occurrences="7" value="o_v" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="me" /> + <ngram occurrences="7" value="m_p" /> + <ngram occurrences="7" value="ká" /> + <ngram occurrences="7" value="kr" /> + <ngram occurrences="7" value="kon" /> + <ngram occurrences="7" value="kl" /> + <ngram occurrences="7" value="kd" /> + <ngram occurrences="7" value="hr" /> + <ngram occurrences="7" value="ev" /> + <ngram occurrences="7" value="est" /> + <ngram occurrences="7" value="dy_" /> + <ngram occurrences="7" value="du_" /> + <ngram occurrences="7" value="dl" /> + <ngram occurrences="7" value="ck" /> + <ngram occurrences="7" value="cho" /> + <ngram occurrences="7" value="byl" /> + <ngram occurrences="7" value="ate" /> + <ngram occurrences="7" value="_zá" /> + <ngram occurrences="7" value="_vý" /> + <ngram occurrences="7" value="_pøed" /> + <ngram occurrences="7" value="_pod" /> + <ngram occurrences="7" value="_od" /> + <ngram occurrences="7" value="_ob" /> + <ngram occurrences="7" value="_ná" /> + <ngram occurrences="7" value="_je_" /> + <ngram occurrences="6" value="ým" /> + <ngram occurrences="6" value="ího" /> + <ngram occurrences="6" value="íh" /> + <ngram occurrences="6" value="í_p" /> + <ngram occurrences="6" value="èi" /> + <ngram occurrences="6" value="èesk" /> + <ngram occurrences="6" value="èes" /> + <ngram occurrences="6" value="ání" /> + <ngram occurrences="6" value="ám" /> + <ngram occurrences="6" value="zi" /> + <ngram occurrences="6" value="zah" /> + <ngram occurrences="6" value="z_" /> + <ngram occurrences="6" value="y_v" /> + <ngram occurrences="6" value="y_s" /> + <ngram occurrences="6" value="y_p" /> + <ngram occurrences="6" value="vìt" /> + <ngram occurrences="6" value="v¹" /> + <ngram occurrences="6" value="vr" /> + <ngram occurrences="6" value="vní" /> + <ngram occurrences="6" value="va_" /> + <ngram occurrences="6" value="um" /> + <ngram occurrences="6" value="uj" /> + <ngram occurrences="6" value="u_n" /> + <ngram occurrences="6" value="u_a" /> + <ngram occurrences="6" value="ty_" /> + <ngram occurrences="6" value="tk" /> + <ngram occurrences="6" value="tel" /> + <ngram occurrences="6" value="tak" /> + <ngram occurrences="6" value="sti" /> + <ngram occurrences="6" value="st_" /> + <ngram occurrences="6" value="si" /> + <ngram occurrences="6" value="sa" /> + <ngram occurrences="6" value="s_p" /> + <ngram occurrences="6" value="ri" /> + <ngram occurrences="6" value="rad" /> + <ngram occurrences="6" value="r_" /> + <ngram occurrences="6" value="ovì" /> + <ngram occurrences="6" value="ova" /> + <ngram occurrences="6" value="ost_" /> + <ngram occurrences="6" value="oru" /> + <ngram occurrences="6" value="odu" /> + <ngram occurrences="6" value="o_ne" /> + <ngram occurrences="6" value="o_k" /> + <ngram occurrences="6" value="ný" /> + <ngram occurrences="6" value="ním" /> + <ngram occurrences="6" value="nsk" /> + <ngram occurrences="6" value="l_p" /> +</ngrams> diff --git a/src/plugins/language/danish.klp b/src/plugins/language/danish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="652" value="_" /> + <ngram occurrences="623" value="e" /> + <ngram occurrences="341" value="r" /> + <ngram occurrences="290" value="n" /> + <ngram occurrences="260" value="t" /> + <ngram occurrences="234" value="s" /> + <ngram occurrences="227" value="i" /> + <ngram occurrences="219" value="a" /> + <ngram occurrences="204" value="d" /> + <ngram occurrences="192" value="l" /> + <ngram occurrences="183" value="o" /> + <ngram occurrences="156" value="g" /> + <ngram occurrences="143" value="e_" /> + <ngram occurrences="138" value="er" /> + <ngram occurrences="137" value="k" /> + <ngram occurrences="119" value="de" /> + <ngram occurrences="108" value="r_" /> + <ngram occurrences="105" value="en" /> + <ngram occurrences="103" value="f" /> + <ngram occurrences="100" value="m" /> + <ngram occurrences="93" value="t_" /> + <ngram occurrences="80" value="er_" /> + <ngram occurrences="80" value="_d" /> + <ngram occurrences="75" value="n_" /> + <ngram occurrences="71" value="b" /> + <ngram occurrences="70" value="v" /> + <ngram occurrences="63" value="u" /> + <ngram occurrences="63" value="_a" /> + <ngram occurrences="62" value="re" /> + <ngram occurrences="61" value="_de" /> + <ngram occurrences="60" value="h" /> + <ngram occurrences="57" value="et" /> + <ngram occurrences="55" value="_e" /> + <ngram occurrences="54" value="te" /> + <ngram occurrences="53" value="_s" /> + <ngram occurrences="51" value="ge" /> + <ngram occurrences="50" value="_f" /> + <ngram occurrences="49" value="st" /> + <ngram occurrences="49" value="g_" /> + <ngram occurrences="48" value="se" /> + <ngram occurrences="48" value="in" /> + <ngram occurrences="47" value="et_" /> + <ngram occurrences="47" value="en_" /> + <ngram occurrences="47" value="el" /> + <ngram occurrences="44" value="le" /> + <ngram occurrences="44" value="_o" /> + <ngram occurrences="43" value="p" /> + <ngram occurrences="42" value="ng" /> + <ngram occurrences="42" value="ar" /> + <ngram occurrences="42" value="an" /> + <ngram occurrences="41" value="or" /> + <ngram occurrences="40" value="ri" /> + <ngram occurrences="38" value="nd" /> + <ngram occurrences="38" value="_k" /> + <ngram occurrences="37" value="og" /> + <ngram occurrences="36" value="c" /> + <ngram occurrences="36" value="_i" /> + <ngram occurrences="35" value="æ" /> + <ngram occurrences="35" value="ti" /> + <ngram occurrences="35" value="s_" /> + <ngram occurrences="34" value="ø" /> + <ngram occurrences="33" value="ne" /> + <ngram occurrences="32" value="fo" /> + <ngram occurrences="32" value="der" /> + <ngram occurrences="32" value="_t" /> + <ngram occurrences="31" value="sk" /> + <ngram occurrences="31" value="og_" /> + <ngram occurrences="31" value="ke" /> + <ngram occurrences="31" value="de_" /> + <ngram occurrences="28" value="is" /> + <ngram occurrences="28" value="for" /> + <ngram occurrences="27" value="es" /> + <ngram occurrences="27" value="be" /> + <ngram occurrences="27" value="_og" /> + <ngram occurrences="26" value="li" /> + <ngram occurrences="26" value="_og_" /> + <ngram occurrences="26" value="_m" /> + <ngram occurrences="26" value="_b" /> + <ngram occurrences="25" value="ma" /> + <ngram occurrences="25" value="d_" /> + <ngram occurrences="25" value="af" /> + <ngram occurrences="25" value="_v" /> + <ngram occurrences="25" value="_fo" /> + <ngram occurrences="24" value="ing" /> + <ngram occurrences="24" value="al" /> + <ngram occurrences="23" value="ve" /> + <ngram occurrences="23" value="un" /> + <ngram occurrences="23" value="j" /> + <ngram occurrences="23" value="i_" /> + <ngram occurrences="23" value="f_" /> + <ngram occurrences="23" value="at" /> + <ngram occurrences="23" value="_for" /> + <ngram occurrences="22" value="ld" /> + <ngram occurrences="22" value="il" /> + <ngram occurrences="22" value="der_" /> + <ngram occurrences="21" value="rs" /> + <ngram occurrences="21" value="re_" /> + <ngram occurrences="21" value="ns" /> + <ngram occurrences="21" value="ls" /> + <ngram occurrences="21" value="ko" /> + <ngram occurrences="21" value="af_" /> + <ngram occurrences="21" value="_af_" /> + <ngram occurrences="21" value="_af" /> + <ngram occurrences="20" value="y" /> + <ngram occurrences="20" value="nde" /> + <ngram occurrences="20" value="ll" /> + <ngram occurrences="20" value="_p" /> + <ngram occurrences="19" value="nge" /> + <ngram occurrences="19" value="els" /> + <ngram occurrences="19" value="det" /> + <ngram occurrences="19" value="ch" /> + <ngram occurrences="19" value="_i_" /> + <ngram occurrences="18" value="on" /> + <ngram occurrences="18" value="me" /> + <ngram occurrences="18" value="ere" /> + <ngram occurrences="18" value="den" /> + <ngram occurrences="18" value="ag" /> + <ngram occurrences="18" value="_en" /> + <ngram occurrences="17" value="ol" /> + <ngram occurrences="17" value="lse" /> + <ngram occurrences="17" value="ke_" /> + <ngram occurrences="17" value="ig" /> + <ngram occurrences="17" value="id" /> + <ngram occurrences="17" value="else" /> + <ngram occurrences="17" value="det_" /> + <ngram occurrences="17" value="_ko" /> + <ngram occurrences="17" value="_det" /> + <ngram occurrences="16" value="rt" /> + <ngram occurrences="16" value="ra" /> + <ngram occurrences="16" value="om" /> + <ngram occurrences="16" value="k_" /> + <ngram occurrences="16" value="ik" /> + <ngram occurrences="16" value="ge_" /> + <ngram occurrences="16" value="ev" /> + <ngram occurrences="16" value="e_d" /> + <ngram occurrences="16" value="_u" /> + <ngram occurrences="16" value="_er" /> + <ngram occurrences="15" value="w" /> + <ngram occurrences="15" value="til" /> + <ngram occurrences="15" value="ta" /> + <ngram occurrences="15" value="ser" /> + <ngram occurrences="15" value="r_d" /> + <ngram occurrences="15" value="m_" /> + <ngram occurrences="15" value="lle" /> + <ngram occurrences="15" value="ha" /> + <ngram occurrences="15" value="em" /> + <ngram occurrences="15" value="_h" /> + <ngram occurrences="15" value="_er_" /> + <ngram occurrences="15" value="_det_" /> + <ngram occurrences="14" value="å" /> + <ngram occurrences="14" value="sti" /> + <ngram occurrences="14" value="ris" /> + <ngram occurrences="14" value="ng_" /> + <ngram occurrences="14" value="ist" /> + <ngram occurrences="14" value="eg" /> + <ngram occurrences="14" value="ed" /> + <ngram occurrences="14" value="e_e" /> + <ngram occurrences="14" value="am" /> + <ngram occurrences="13" value="und" /> + <ngram occurrences="13" value="ter" /> + <ngram occurrences="13" value="ske" /> + <ngram occurrences="13" value="rk" /> + <ngram occurrences="13" value="r_de" /> + <ngram occurrences="13" value="op" /> + <ngram occurrences="13" value="ing_" /> + <ngram occurrences="13" value="e_a" /> + <ngram occurrences="13" value="an_" /> + <ngram occurrences="13" value="_de_" /> + <ngram occurrences="12" value="ør" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="ser_" /> + <ngram occurrences="12" value="rist" /> + <ngram occurrences="12" value="rin" /> + <ngram occurrences="12" value="or_" /> + <ngram occurrences="12" value="nt" /> + <ngram occurrences="12" value="la" /> + <ngram occurrences="12" value="l_" /> + <ngram occurrences="12" value="ie" /> + <ngram occurrences="12" value="da" /> + <ngram occurrences="12" value="br" /> + <ngram occurrences="12" value="at_" /> + <ngram occurrences="12" value="_l" /> + <ngram occurrences="12" value="_der" /> + <ngram occurrences="12" value="_at_" /> + <ngram occurrences="12" value="_at" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="tr" /> + <ngram occurrences="11" value="t_d" /> + <ngram occurrences="11" value="si" /> + <ngram occurrences="11" value="ro" /> + <ngram occurrences="11" value="ren" /> + <ngram occurrences="11" value="r_f" /> + <ngram occurrences="11" value="r_e" /> + <ngram occurrences="11" value="old" /> + <ngram occurrences="11" value="ne_" /> + <ngram occurrences="11" value="kr" /> + <ngram occurrences="11" value="kon" /> + <ngram occurrences="11" value="kke" /> + <ngram occurrences="11" value="kk" /> + <ngram occurrences="11" value="ige" /> + <ngram occurrences="11" value="gt" /> + <ngram occurrences="11" value="es_" /> + <ngram occurrences="11" value="ers" /> + <ngram occurrences="11" value="eri" /> + <ngram occurrences="11" value="ens" /> + <ngram occurrences="11" value="end" /> + <ngram occurrences="11" value="e_de" /> + <ngram occurrences="11" value="e_b" /> + <ngram occurrences="11" value="ce" /> + <ngram occurrences="11" value="_der_" /> + <ngram occurrences="10" value="te_" /> + <ngram occurrences="10" value="ste" /> + <ngram occurrences="10" value="ske_" /> + <ngram occurrences="10" value="sen" /> + <ngram occurrences="10" value="se_" /> + <ngram occurrences="10" value="ring" /> + <ngram occurrences="10" value="r_s" /> + <ngram occurrences="10" value="ni" /> + <ngram occurrences="10" value="n_a" /> + <ngram occurrences="10" value="ler" /> + <ngram occurrences="10" value="il_" /> + <ngram occurrences="10" value="hr" /> + <ngram occurrences="10" value="ho" /> + <ngram occurrences="10" value="ger" /> + <ngram occurrences="10" value="gen" /> + <ngram occurrences="10" value="fr" /> + <ngram occurrences="10" value="for_" /> + <ngram occurrences="10" value="e_f" /> + <ngram occurrences="10" value="di" /> + <ngram occurrences="10" value="den_" /> + <ngram occurrences="10" value="ark" /> + <ngram occurrences="10" value="_w" /> + <ngram occurrences="10" value="_til" /> + <ngram occurrences="10" value="_ti" /> + <ngram occurrences="10" value="_st" /> + <ngram occurrences="10" value="_ma" /> + <ngram occurrences="10" value="_j" /> + <ngram occurrences="10" value="_den" /> + <ngram occurrences="10" value="_c" /> + <ngram occurrences="10" value="_ar" /> + <ngram occurrences="9" value="ær" /> + <ngram occurrences="9" value="va" /> + <ngram occurrences="9" value="til_" /> + <ngram occurrences="9" value="t_s" /> + <ngram occurrences="9" value="t_e" /> + <ngram occurrences="9" value="t_de" /> + <ngram occurrences="9" value="so" /> + <ngram occurrences="9" value="rd" /> + <ngram occurrences="9" value="r_o" /> + <ngram occurrences="9" value="pr" /> + <ngram occurrences="9" value="nder" /> + <ngram occurrences="9" value="lse_" /> + <ngram occurrences="9" value="lig" /> + <ngram occurrences="9" value="ki" /> + <ngram occurrences="9" value="ide" /> + <ngram occurrences="9" value="er_o" /> + <ngram occurrences="9" value="ene" /> + <ngram occurrences="9" value="else_" /> + <ngram occurrences="9" value="ek" /> + <ngram occurrences="9" value="eb" /> + <ngram occurrences="9" value="e_s" /> + <ngram occurrences="9" value="_un" /> + <ngram occurrences="9" value="_g" /> + <ngram occurrences="9" value="_fr" /> + <ngram occurrences="9" value="_for_" /> + <ngram occurrences="8" value="v_" /> + <ngram occurrences="8" value="unde" /> + <ngram occurrences="8" value="tt" /> + <ngram occurrences="8" value="t_i" /> + <ngram occurrences="8" value="t_a" /> + <ngram occurrences="8" value="sto" /> + <ngram occurrences="8" value="sc" /> + <ngram occurrences="8" value="sa" /> + <ngram occurrences="8" value="risti" /> + <ngram occurrences="8" value="r_i" /> + <ngram occurrences="8" value="ot" /> + <ngram occurrences="8" value="ns_" /> + <ngram occurrences="8" value="nn" /> + <ngram occurrences="8" value="nd_" /> + <ngram occurrences="8" value="nc" /> + <ngram occurrences="8" value="n_d" /> + <ngram occurrences="8" value="mi" /> + <ngram occurrences="8" value="lin" /> + <ngram occurrences="8" value="le_" /> + <ngram occurrences="8" value="lde" /> + <ngram occurrences="8" value="ka" /> + <ngram occurrences="8" value="isti" /> + <ngram occurrences="8" value="ikke" /> + <ngram occurrences="8" value="ikk" /> + <ngram occurrences="8" value="ia" /> + <ngram occurrences="8" value="hri" /> + <ngram occurrences="8" value="hol" /> + <ngram occurrences="8" value="he" /> + <ngram occurrences="8" value="gs" /> + <ngram occurrences="8" value="gel" /> + <ngram occurrences="8" value="g_s" /> + <ngram occurrences="8" value="ft" /> + <ngram occurrences="8" value="ere_" /> + <ngram occurrences="8" value="er_e" /> + <ngram occurrences="8" value="er_d" /> + <ngram occurrences="8" value="ent" /> + <ngram occurrences="8" value="ens_" /> + <ngram occurrences="8" value="en_a" /> + <ngram occurrences="8" value="e_o" /> + <ngram occurrences="8" value="e_for" /> + <ngram occurrences="8" value="e_fo" /> + <ngram occurrences="8" value="del" /> + <ngram occurrences="8" value="chri" /> + <ngram occurrences="8" value="chr" /> + <ngram occurrences="8" value="av" /> + <ngram occurrences="8" value="ar_" /> + <ngram occurrences="8" value="ale" /> + <ngram occurrences="8" value="age" /> + <ngram occurrences="8" value="_und" /> + <ngram occurrences="8" value="_til_" /> + <ngram occurrences="8" value="_sk" /> + <ngram occurrences="8" value="_si" /> + <ngram occurrences="8" value="_et_" /> + <ngram occurrences="8" value="_et" /> + <ngram occurrences="8" value="_en_" /> + <ngram occurrences="8" value="_da" /> + <ngram occurrences="7" value="æl" /> + <ngram occurrences="7" value="ver" /> + <ngram occurrences="7" value="us" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="ts" /> + <ngram occurrences="7" value="tel" /> + <ngram occurrences="7" value="t_k" /> + <ngram occurrences="7" value="skr" /> + <ngram occurrences="7" value="sch" /> + <ngram occurrences="7" value="rn" /> + <ngram occurrences="7" value="ret" /> + <ngram occurrences="7" value="rb" /> + <ngram occurrences="7" value="r_a" /> + <ngram occurrences="7" value="ov" /> + <ngram occurrences="7" value="ote" /> + <ngram occurrences="7" value="ors" /> + <ngram occurrences="7" value="om_" /> + <ngram occurrences="7" value="nne" /> + <ngram occurrences="7" value="nce" /> + <ngram occurrences="7" value="mar" /> + <ngram occurrences="7" value="kt" /> + <ngram occurrences="7" value="kke_" /> + <ngram occurrences="7" value="ind" /> + <ngram occurrences="7" value="in_" /> + <ngram occurrences="7" value="ikke_" /> + <ngram occurrences="7" value="ige_" /> + <ngram occurrences="7" value="hrist" /> + <ngram occurrences="7" value="hris" /> + <ngram occurrences="7" value="hold" /> + <ngram occurrences="7" value="gr" /> + <ngram occurrences="7" value="ger_" /> + <ngram occurrences="7" value="gen_" /> + <ngram occurrences="7" value="g_e" /> + <ngram occurrences="7" value="g_a" /> + <ngram occurrences="7" value="er_s" /> + <ngram occurrences="7" value="er_de" /> + <ngram occurrences="7" value="ende" /> + <ngram occurrences="7" value="ed_" /> + <ngram occurrences="7" value="e_v" /> + <ngram occurrences="7" value="e_t" /> + <ngram occurrences="7" value="e_l" /> + <ngram occurrences="7" value="e_i" /> + <ngram occurrences="7" value="ds" /> + <ngram occurrences="7" value="dan" /> + <ngram occurrences="7" value="chris" /> + <ngram occurrences="7" value="bl" /> + <ngram occurrences="7" value="all" /> + <ngram occurrences="7" value="_vi" /> + <ngram occurrences="7" value="_va" /> + <ngram occurrences="7" value="_te" /> + <ngram occurrences="7" value="_r" /> + <ngram occurrences="7" value="_pr" /> + <ngram occurrences="7" value="_n" /> + <ngram occurrences="7" value="_me" /> + <ngram occurrences="7" value="_kon" /> + <ngram occurrences="7" value="_in" /> + <ngram occurrences="7" value="_ikke" /> + <ngram occurrences="7" value="_ikk" /> + <ngram occurrences="7" value="_ik" /> + <ngram occurrences="7" value="_di" /> + <ngram occurrences="7" value="_chri" /> + <ngram occurrences="7" value="_chr" /> + <ngram occurrences="7" value="_ch" /> + <ngram occurrences="7" value="_br" /> + <ngram occurrences="7" value="_be" /> + <ngram occurrences="6" value="æn" /> + <ngram occurrences="6" value="å_" /> + <ngram occurrences="6" value="væ" /> + <ngram occurrences="6" value="var_" /> + <ngram occurrences="6" value="var" /> + <ngram occurrences="6" value="under" /> + <ngram occurrences="6" value="tte" /> + <ngram occurrences="6" value="tian_" /> + <ngram occurrences="6" value="tian" /> + <ngram occurrences="6" value="tia" /> + <ngram occurrences="6" value="ter_" /> + <ngram occurrences="6" value="ten" /> + <ngram occurrences="6" value="tal" /> + <ngram occurrences="6" value="t_v" /> +</ngrams> diff --git a/src/plugins/language/dutch.klp b/src/plugins/language/dutch.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="771" value="_" /> + <ngram occurrences="769" value="e" /> + <ngram occurrences="425" value="n" /> + <ngram occurrences="302" value="t" /> + <ngram occurrences="293" value="a" /> + <ngram occurrences="282" value="i" /> + <ngram occurrences="256" value="r" /> + <ngram occurrences="242" value="d" /> + <ngram occurrences="221" value="n_" /> + <ngram occurrences="214" value="o" /> + <ngram occurrences="181" value="en" /> + <ngram occurrences="168" value="s" /> + <ngram occurrences="139" value="g" /> + <ngram occurrences="139" value="e_" /> + <ngram occurrences="137" value="l" /> + <ngram occurrences="137" value="en_" /> + <ngram occurrences="133" value="t_" /> + <ngram occurrences="122" value="de" /> + <ngram occurrences="117" value="er" /> + <ngram occurrences="110" value="v" /> + <ngram occurrences="103" value="u" /> + <ngram occurrences="96" value="k" /> + <ngram occurrences="93" value="_d" /> + <ngram occurrences="92" value="h" /> + <ngram occurrences="81" value="an" /> + <ngram occurrences="79" value="j" /> + <ngram occurrences="78" value="_v" /> + <ngram occurrences="76" value="m" /> + <ngram occurrences="74" value="ge" /> + <ngram occurrences="71" value="b" /> + <ngram occurrences="70" value="in" /> + <ngram occurrences="68" value="r_" /> + <ngram occurrences="67" value="et" /> + <ngram occurrences="65" value="z" /> + <ngram occurrences="64" value="te" /> + <ngram occurrences="59" value="p" /> + <ngram occurrences="56" value="ij" /> + <ngram occurrences="56" value="_e" /> + <ngram occurrences="54" value="st" /> + <ngram occurrences="52" value="de_" /> + <ngram occurrences="52" value="_h" /> + <ngram occurrences="51" value="aa" /> + <ngram occurrences="50" value="w" /> + <ngram occurrences="50" value="ie" /> + <ngram occurrences="50" value="et_" /> + <ngram occurrences="50" value="_z" /> + <ngram occurrences="48" value="ee" /> + <ngram occurrences="48" value="_de" /> + <ngram occurrences="47" value="an_" /> + <ngram occurrences="43" value="s_" /> + <ngram occurrences="43" value="el" /> + <ngram occurrences="41" value="he" /> + <ngram occurrences="40" value="ve" /> + <ngram occurrences="40" value="_o" /> + <ngram occurrences="40" value="_de_" /> + <ngram occurrences="40" value="_b" /> + <ngram occurrences="38" value="er_" /> + <ngram occurrences="38" value="c" /> + <ngram occurrences="38" value="_s" /> + <ngram occurrences="38" value="_i" /> + <ngram occurrences="37" value="at" /> + <ngram occurrences="37" value="_m" /> + <ngram occurrences="37" value="_a" /> + <ngram occurrences="36" value="le" /> + <ngram occurrences="36" value="be" /> + <ngram occurrences="36" value="ar" /> + <ngram occurrences="36" value="_g" /> + <ngram occurrences="35" value="ng" /> + <ngram occurrences="35" value="den" /> + <ngram occurrences="35" value="_he" /> + <ngram occurrences="33" value="va" /> + <ngram occurrences="33" value="ni" /> + <ngram occurrences="32" value="or" /> + <ngram occurrences="32" value="oo" /> + <ngram occurrences="31" value="nt" /> + <ngram occurrences="31" value="g_" /> + <ngram occurrences="31" value="_va" /> + <ngram occurrences="30" value="van" /> + <ngram occurrences="30" value="nd" /> + <ngram occurrences="30" value="n_d" /> + <ngram occurrences="30" value="da" /> + <ngram occurrences="30" value="d_" /> + <ngram occurrences="29" value="ver" /> + <ngram occurrences="29" value="van_" /> + <ngram occurrences="29" value="ud" /> + <ngram occurrences="29" value="re" /> + <ngram occurrences="29" value="_w" /> + <ngram occurrences="29" value="_k" /> + <ngram occurrences="28" value="tu" /> + <ngram occurrences="28" value="_van" /> + <ngram occurrences="27" value="ze" /> + <ngram occurrences="27" value="ri" /> + <ngram occurrences="27" value="ing" /> + <ngram occurrences="27" value="di" /> + <ngram occurrences="27" value="_van_" /> + <ngram occurrences="27" value="_t" /> + <ngram occurrences="26" value="vo" /> + <ngram occurrences="26" value="stu" /> + <ngram occurrences="26" value="n_v" /> + <ngram occurrences="26" value="_st" /> + <ngram occurrences="25" value="zi" /> + <ngram occurrences="25" value="het" /> + <ngram occurrences="25" value="at_" /> + <ngram occurrences="25" value="al" /> + <ngram occurrences="25" value="_zi" /> + <ngram occurrences="25" value="_in" /> + <ngram occurrences="25" value="_het" /> + <ngram occurrences="25" value="_ge" /> + <ngram occurrences="25" value="_be" /> + <ngram occurrences="24" value="on" /> + <ngram occurrences="24" value="het_" /> + <ngram occurrences="24" value="gen" /> + <ngram occurrences="24" value="ch" /> + <ngram occurrences="24" value="aar" /> + <ngram occurrences="24" value="_het_" /> + <ngram occurrences="24" value="_da" /> + <ngram occurrences="23" value="rd" /> + <ngram occurrences="23" value="li" /> + <ngram occurrences="23" value="ke" /> + <ngram occurrences="23" value="k_" /> + <ngram occurrences="23" value="f" /> + <ngram occurrences="23" value="es" /> + <ngram occurrences="22" value="ude" /> + <ngram occurrences="22" value="tud" /> + <ngram occurrences="22" value="ti" /> + <ngram occurrences="22" value="stud" /> + <ngram occurrences="22" value="is" /> + <ngram occurrences="22" value="_vo" /> + <ngram occurrences="22" value="_stu" /> + <ngram occurrences="21" value="t_d" /> + <ngram occurrences="21" value="op" /> + <ngram occurrences="21" value="it" /> + <ngram occurrences="21" value="den_" /> + <ngram occurrences="20" value="we" /> + <ngram occurrences="20" value="ra" /> + <ngram occurrences="20" value="oe" /> + <ngram occurrences="20" value="me" /> + <ngram occurrences="20" value="ed" /> + <ngram occurrences="20" value="_ve" /> + <ngram occurrences="20" value="_stud" /> + <ngram occurrences="19" value="_en_" /> + <ngram occurrences="19" value="_en" /> + <ngram occurrences="19" value="_ee" /> + <ngram occurrences="18" value="ui" /> + <ngram occurrences="18" value="uden" /> + <ngram occurrences="18" value="ten" /> + <ngram occurrences="18" value="se" /> + <ngram occurrences="18" value="ro" /> + <ngram occurrences="18" value="oor" /> + <ngram occurrences="18" value="ne" /> + <ngram occurrences="18" value="l_" /> + <ngram occurrences="18" value="gen_" /> + <ngram occurrences="18" value="een" /> + <ngram occurrences="18" value="dat_" /> + <ngram occurrences="18" value="dat" /> + <ngram occurrences="18" value="_ver" /> + <ngram occurrences="17" value="n_z" /> + <ngram occurrences="17" value="ie_" /> + <ngram occurrences="17" value="eg" /> + <ngram occurrences="17" value="eer" /> + <ngram occurrences="17" value="een_" /> + <ngram occurrences="17" value="der" /> + <ngram occurrences="17" value="_n" /> + <ngram occurrences="17" value="_j" /> + <ngram occurrences="17" value="_een" /> + <ngram occurrences="16" value="zij" /> + <ngram occurrences="16" value="ten_" /> + <ngram occurrences="16" value="te_" /> + <ngram occurrences="16" value="rs" /> + <ngram occurrences="16" value="nte" /> + <ngram occurrences="16" value="nge" /> + <ngram occurrences="16" value="nde" /> + <ngram occurrences="16" value="n_de" /> + <ngram occurrences="16" value="jn" /> + <ngram occurrences="16" value="ijn" /> + <ngram occurrences="16" value="eu" /> + <ngram occurrences="16" value="ent" /> + <ngram occurrences="16" value="e_v" /> + <ngram occurrences="16" value="_zij" /> + <ngram occurrences="16" value="_l" /> + <ngram occurrences="16" value="_een_" /> + <ngram occurrences="15" value="tude" /> + <ngram occurrences="15" value="stude" /> + <ngram occurrences="15" value="pa" /> + <ngram occurrences="15" value="p_" /> + <ngram occurrences="15" value="ng_" /> + <ngram occurrences="15" value="n_de_" /> + <ngram occurrences="15" value="je" /> + <ngram occurrences="15" value="en_v" /> + <ngram occurrences="15" value="en_d" /> + <ngram occurrences="15" value="ek" /> + <ngram occurrences="15" value="die" /> + <ngram occurrences="15" value="_dat_" /> + <ngram occurrences="15" value="_dat" /> + <ngram occurrences="14" value="zijn_" /> + <ngram occurrences="14" value="zijn" /> + <ngram occurrences="14" value="un" /> + <ngram occurrences="14" value="ste" /> + <ngram occurrences="14" value="ns" /> + <ngram occurrences="14" value="n_s" /> + <ngram occurrences="14" value="ma" /> + <ngram occurrences="14" value="jn_" /> + <ngram occurrences="14" value="in_" /> + <ngram occurrences="14" value="ijn_" /> + <ngram occurrences="14" value="gel" /> + <ngram occurrences="14" value="en_z" /> + <ngram occurrences="14" value="ar_" /> + <ngram occurrences="14" value="aar_" /> + <ngram occurrences="14" value="aan" /> + <ngram occurrences="14" value="_zijn" /> + <ngram occurrences="14" value="_ze" /> + <ngram occurrences="14" value="_p" /> + <ngram occurrences="13" value="ze_" /> + <ngram occurrences="13" value="t_e" /> + <ngram occurrences="13" value="sc" /> + <ngram occurrences="13" value="ot" /> + <ngram occurrences="13" value="nie" /> + <ngram occurrences="13" value="n_o" /> + <ngram occurrences="13" value="n_h" /> + <ngram occurrences="13" value="mo" /> + <ngram occurrences="13" value="la" /> + <ngram occurrences="13" value="je_" /> + <ngram occurrences="13" value="ho" /> + <ngram occurrences="13" value="erd" /> + <ngram occurrences="13" value="ei" /> + <ngram occurrences="13" value="an_d" /> + <ngram occurrences="13" value="_op" /> + <ngram occurrences="13" value="_in_" /> + <ngram occurrences="13" value="_al" /> + <ngram occurrences="12" value="wa" /> + <ngram occurrences="12" value="voor" /> + <ngram occurrences="12" value="voo" /> + <ngram occurrences="12" value="ta" /> + <ngram occurrences="12" value="rt" /> + <ngram occurrences="12" value="om" /> + <ngram occurrences="12" value="n_w" /> + <ngram occurrences="12" value="ll" /> + <ngram occurrences="12" value="lij" /> + <ngram occurrences="12" value="jk" /> + <ngram occurrences="12" value="inge" /> + <ngram occurrences="12" value="ijk" /> + <ngram occurrences="12" value="ic" /> + <ngram occurrences="12" value="ente" /> + <ngram occurrences="12" value="aan_" /> + <ngram occurrences="12" value="_voor" /> + <ngram occurrences="12" value="_voo" /> + <ngram occurrences="12" value="_u" /> + <ngram occurrences="12" value="_te" /> + <ngram occurrences="11" value="zo" /> + <ngram occurrences="11" value="udent" /> + <ngram occurrences="11" value="tuden" /> + <ngram occurrences="11" value="to" /> + <ngram occurrences="11" value="ter" /> + <ngram occurrences="11" value="t_de" /> + <ngram occurrences="11" value="sch" /> + <ngram occurrences="11" value="rde" /> + <ngram occurrences="11" value="or_" /> + <ngram occurrences="11" value="op_" /> + <ngram occurrences="11" value="oor_" /> + <ngram occurrences="11" value="ol" /> + <ngram occurrences="11" value="n_ve" /> + <ngram occurrences="11" value="n_e" /> + <ngram occurrences="11" value="n_a" /> + <ngram occurrences="11" value="lijk" /> + <ngram occurrences="11" value="ing_" /> + <ngram occurrences="11" value="ers" /> + <ngram occurrences="11" value="en_o" /> + <ngram occurrences="11" value="el_" /> + <ngram occurrences="11" value="e_o" /> + <ngram occurrences="11" value="dent" /> + <ngram occurrences="11" value="ag" /> + <ngram occurrences="11" value="ad" /> + <ngram occurrences="11" value="_mo" /> + <ngram occurrences="11" value="_me" /> + <ngram occurrences="11" value="_je_" /> + <ngram occurrences="11" value="_je" /> + <ngram occurrences="10" value="t_z" /> + <ngram occurrences="10" value="t_m" /> + <ngram occurrences="10" value="t_de_" /> + <ngram occurrences="10" value="t_be" /> + <ngram occurrences="10" value="t_b" /> + <ngram occurrences="10" value="r_d" /> + <ngram occurrences="10" value="ou" /> + <ngram occurrences="10" value="nt_" /> + <ngram occurrences="10" value="nder" /> + <ngram occurrences="10" value="n_zi" /> + <ngram occurrences="10" value="n_ver" /> + <ngram occurrences="10" value="n_t" /> + <ngram occurrences="10" value="n_st" /> + <ngram occurrences="10" value="n_g" /> + <ngram occurrences="10" value="n_b" /> + <ngram occurrences="10" value="m_" /> + <ngram occurrences="10" value="len" /> + <ngram occurrences="10" value="iet" /> + <ngram occurrences="10" value="ich" /> + <ngram occurrences="10" value="gr" /> + <ngram occurrences="10" value="est" /> + <ngram occurrences="10" value="ep" /> + <ngram occurrences="10" value="em" /> + <ngram occurrences="10" value="eke" /> + <ngram occurrences="10" value="e_h" /> + <ngram occurrences="10" value="die_" /> + <ngram occurrences="10" value="dente" /> + <ngram occurrences="10" value="_nie" /> + <ngram occurrences="10" value="_ni" /> + <ngram occurrences="10" value="_er" /> + <ngram occurrences="10" value="_di" /> + <ngram occurrences="9" value="van_d" /> + <ngram occurrences="9" value="ur" /> + <ngram occurrences="9" value="uit" /> + <ngram occurrences="9" value="tr" /> + <ngram occurrences="9" value="t_h" /> + <ngram occurrences="9" value="rk" /> + <ngram occurrences="9" value="nten" /> + <ngram occurrences="9" value="nn" /> + <ngram occurrences="9" value="niet" /> + <ngram occurrences="9" value="ngen" /> + <ngram occurrences="9" value="na" /> + <ngram occurrences="9" value="n_i" /> + <ngram occurrences="9" value="n_he" /> + <ngram occurrences="9" value="mi" /> + <ngram occurrences="9" value="kr" /> + <ngram occurrences="9" value="is_" /> + <ngram occurrences="9" value="ig" /> + <ngram occurrences="9" value="iet_" /> + <ngram occurrences="9" value="hu" /> + <ngram occurrences="9" value="ev" /> + <ngram occurrences="9" value="ere" /> + <ngram occurrences="9" value="enten" /> + <ngram occurrences="9" value="en_e" /> + <ngram occurrences="9" value="elijk" /> + <ngram occurrences="9" value="elij" /> + <ngram occurrences="9" value="eli" /> + <ngram occurrences="9" value="ele" /> + <ngram occurrences="9" value="ege" /> + <ngram occurrences="9" value="eb" /> + <ngram occurrences="9" value="e_va" /> + <ngram occurrences="9" value="e_s" /> + <ngram occurrences="9" value="e_d" /> + <ngram occurrences="9" value="do" /> + <ngram occurrences="9" value="der_" /> + <ngram occurrences="9" value="ba" /> + <ngram occurrences="9" value="as" /> + <ngram occurrences="9" value="_zo" /> + <ngram occurrences="9" value="_we" /> + <ngram occurrences="9" value="_wa" /> + <ngram occurrences="9" value="_niet" /> + <ngram occurrences="9" value="_le" /> + <ngram occurrences="9" value="_aa" /> + <ngram occurrences="8" value="wi" /> + <ngram occurrences="8" value="ven" /> + <ngram occurrences="8" value="us" /> + <ngram occurrences="8" value="ts" /> + <ngram occurrences="8" value="tij" /> + <ngram occurrences="8" value="se_" /> + <ngram occurrences="8" value="rij" /> + <ngram occurrences="8" value="ren" /> + <ngram occurrences="8" value="r_z" /> + <ngram occurrences="8" value="pe" /> + <ngram occurrences="8" value="ond" /> + <ngram occurrences="8" value="og" /> + <ngram occurrences="8" value="nten_" /> + <ngram occurrences="8" value="no" /> + <ngram occurrences="8" value="ning" /> + <ngram occurrences="8" value="nin" /> + <ngram occurrences="8" value="niet_" /> + <ngram occurrences="8" value="ngen_" /> + <ngram occurrences="8" value="nd_" /> + <ngram occurrences="8" value="n_vo" /> + <ngram occurrences="8" value="n_stu" /> + <ngram occurrences="8" value="n_in" /> + <ngram occurrences="8" value="n_ge" /> + <ngram occurrences="8" value="n_be" /> + <ngram occurrences="8" value="met_" /> + <ngram occurrences="8" value="met" /> + <ngram occurrences="8" value="lle" /> + <ngram occurrences="8" value="len_" /> + <ngram occurrences="8" value="ker" /> + <ngram occurrences="8" value="ken" /> + <ngram occurrences="8" value="jd" /> + <ngram occurrences="8" value="j_" /> + <ngram occurrences="8" value="it_" /> + <ngram occurrences="8" value="ingen" /> + <ngram occurrences="8" value="ik" /> + <ngram occurrences="8" value="ijd" /> + <ngram occurrences="8" value="ij_" /> + <ngram occurrences="8" value="h_" /> + <ngram occurrences="8" value="gro" /> + <ngram occurrences="8" value="g_v" /> + <ngram occurrences="8" value="even" /> + <ngram occurrences="8" value="eve" /> + <ngram occurrences="8" value="end" /> + <ngram occurrences="8" value="en_zi" /> + <ngram occurrences="8" value="eerd" /> + <ngram occurrences="8" value="ede" /> + <ngram occurrences="8" value="e_van" /> + <ngram occurrences="8" value="e_st" /> + <ngram occurrences="8" value="e_b" /> + <ngram occurrences="8" value="ch_" /> + <ngram occurrences="8" value="bi" /> +</ngrams> diff --git a/src/plugins/language/english.klp b/src/plugins/language/english.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="619" value="_" /> + <ngram occurrences="461" value="e" /> + <ngram occurrences="304" value="t" /> + <ngram occurrences="250" value="n" /> + <ngram occurrences="238" value="i" /> + <ngram occurrences="234" value="a" /> + <ngram occurrences="215" value="o" /> + <ngram occurrences="209" value="s" /> + <ngram occurrences="194" value="r" /> + <ngram occurrences="147" value="h" /> + <ngram occurrences="144" value="e_" /> + <ngram occurrences="119" value="d" /> + <ngram occurrences="116" value="_t" /> + <ngram occurrences="106" value="c" /> + <ngram occurrences="98" value="th" /> + <ngram occurrences="94" value="s_" /> + <ngram occurrences="90" value="l" /> + <ngram occurrences="90" value="he" /> + <ngram occurrences="88" value="_th" /> + <ngram occurrences="86" value="_a" /> + <ngram occurrences="81" value="m" /> + <ngram occurrences="81" value="f" /> + <ngram occurrences="79" value="the" /> + <ngram occurrences="78" value="u" /> + <ngram occurrences="73" value="_the" /> + <ngram occurrences="68" value="p" /> + <ngram occurrences="65" value="he_" /> + <ngram occurrences="65" value="er" /> + <ngram occurrences="63" value="the_" /> + <ngram occurrences="63" value="d_" /> + <ngram occurrences="63" value="_the_" /> + <ngram occurrences="58" value="n_" /> + <ngram occurrences="58" value="in" /> + <ngram occurrences="56" value="_o" /> + <ngram occurrences="55" value="on" /> + <ngram occurrences="55" value="en" /> + <ngram occurrences="54" value="re" /> + <ngram occurrences="54" value="_i" /> + <ngram occurrences="53" value="y" /> + <ngram occurrences="52" value="t_" /> + <ngram occurrences="49" value="b" /> + <ngram occurrences="48" value="g" /> + <ngram occurrences="46" value="v" /> + <ngram occurrences="45" value="an" /> + <ngram occurrences="44" value="es" /> + <ngram occurrences="43" value="y_" /> + <ngram occurrences="43" value="w" /> + <ngram occurrences="41" value="ti" /> + <ngram occurrences="40" value="nd" /> + <ngram occurrences="38" value="f_" /> + <ngram occurrences="37" value="r_" /> + <ngram occurrences="37" value="of_" /> + <ngram occurrences="37" value="of" /> + <ngram occurrences="37" value="_of_" /> + <ngram occurrences="37" value="_of" /> + <ngram occurrences="35" value="io" /> + <ngram occurrences="35" value="at" /> + <ngram occurrences="35" value="_w" /> + <ngram occurrences="35" value="_in" /> + <ngram occurrences="34" value="nt" /> + <ngram occurrences="33" value="ve" /> + <ngram occurrences="33" value="me" /> + <ngram occurrences="32" value="ed" /> + <ngram occurrences="31" value="ion" /> + <ngram occurrences="31" value="de" /> + <ngram occurrences="31" value="_p" /> + <ngram occurrences="30" value="on_" /> + <ngram occurrences="29" value="_an" /> + <ngram occurrences="28" value="se" /> + <ngram occurrences="28" value="nd_" /> + <ngram occurrences="28" value="it" /> + <ngram occurrences="28" value="and" /> + <ngram occurrences="27" value="ns" /> + <ngram occurrences="27" value="and_" /> + <ngram occurrences="27" value="_and_" /> + <ngram occurrences="27" value="_and" /> + <ngram occurrences="26" value="st" /> + <ngram occurrences="26" value="ed_" /> + <ngram occurrences="26" value="ar" /> + <ngram occurrences="24" value="s_a" /> + <ngram occurrences="24" value="ion_" /> + <ngram occurrences="24" value="ha" /> + <ngram occurrences="24" value="_s" /> + <ngram occurrences="24" value="_m" /> + <ngram occurrences="23" value="to" /> + <ngram occurrences="23" value="or" /> + <ngram occurrences="23" value="o_" /> + <ngram occurrences="23" value="is" /> + <ngram occurrences="23" value="ent" /> + <ngram occurrences="23" value="_b" /> + <ngram occurrences="22" value="ic" /> + <ngram occurrences="22" value="er_" /> + <ngram occurrences="22" value="ea" /> + <ngram occurrences="22" value="_c" /> + <ngram occurrences="21" value="to_" /> + <ngram occurrences="21" value="le" /> + <ngram occurrences="21" value="es_" /> + <ngram occurrences="21" value="_to" /> + <ngram occurrences="21" value="_d" /> + <ngram occurrences="20" value="te" /> + <ngram occurrences="20" value="ie" /> + <ngram occurrences="20" value="ci" /> + <ngram occurrences="20" value="be" /> + <ngram occurrences="20" value="_to_" /> + <ngram occurrences="19" value="tio" /> + <ngram occurrences="19" value="al" /> + <ngram occurrences="19" value="_f" /> + <ngram occurrences="18" value="ty" /> + <ngram occurrences="18" value="tion" /> + <ngram occurrences="18" value="of_th" /> + <ngram occurrences="18" value="of_t" /> + <ngram occurrences="18" value="men" /> + <ngram occurrences="18" value="in_" /> + <ngram occurrences="18" value="f_th" /> + <ngram occurrences="18" value="f_t" /> + <ngram occurrences="18" value="ec" /> + <ngram occurrences="18" value="_of_t" /> + <ngram occurrences="17" value="s_t" /> + <ngram occurrences="17" value="ng" /> + <ngram occurrences="17" value="hi" /> + <ngram occurrences="17" value="e_t" /> + <ngram occurrences="17" value="ct" /> + <ngram occurrences="17" value="ce" /> + <ngram occurrences="17" value="as" /> + <ngram occurrences="17" value="a_" /> + <ngram occurrences="17" value="_h" /> + <ngram occurrences="17" value="_e" /> + <ngram occurrences="16" value="ra" /> + <ngram occurrences="16" value="pr" /> + <ngram occurrences="16" value="pe" /> + <ngram occurrences="16" value="ou" /> + <ngram occurrences="16" value="f_the" /> + <ngram occurrences="16" value="e_a" /> + <ngram occurrences="16" value="co" /> + <ngram occurrences="16" value="_de" /> + <ngram occurrences="15" value="ts" /> + <ngram occurrences="15" value="ss" /> + <ngram occurrences="15" value="s_o" /> + <ngram occurrences="15" value="ro" /> + <ngram occurrences="15" value="ri" /> + <ngram occurrences="15" value="ns_" /> + <ngram occurrences="15" value="nc" /> + <ngram occurrences="15" value="l_" /> + <ngram occurrences="15" value="_r" /> + <ngram occurrences="15" value="_co" /> + <ngram occurrences="14" value="ts_" /> + <ngram occurrences="14" value="tion_" /> + <ngram occurrences="14" value="rt" /> + <ngram occurrences="14" value="re_" /> + <ngram occurrences="14" value="pa" /> + <ngram occurrences="14" value="n_t" /> + <ngram occurrences="14" value="_a_" /> + <ngram occurrences="13" value="ver" /> + <ngram occurrences="13" value="ve_" /> + <ngram occurrences="13" value="un" /> + <ngram occurrences="13" value="ty_" /> + <ngram occurrences="13" value="s_and" /> + <ngram occurrences="13" value="s_an" /> + <ngram occurrences="13" value="ng_" /> + <ngram occurrences="13" value="n_th" /> + <ngram occurrences="13" value="ment" /> + <ngram occurrences="13" value="li" /> + <ngram occurrences="13" value="il" /> + <ngram occurrences="13" value="g_" /> + <ngram occurrences="13" value="em" /> + <ngram occurrences="13" value="e_o" /> + <ngram occurrences="13" value="e_m" /> + <ngram occurrences="13" value="d_t" /> + <ngram occurrences="13" value="at_" /> + <ngram occurrences="13" value="ac" /> + <ngram occurrences="13" value="_re" /> + <ngram occurrences="13" value="_in_" /> + <ngram occurrences="13" value="_g" /> + <ngram occurrences="12" value="we" /> + <ngram occurrences="12" value="ta" /> + <ngram occurrences="12" value="s_th" /> + <ngram occurrences="12" value="s_of_" /> + <ngram occurrences="12" value="s_of" /> + <ngram occurrences="12" value="nt_" /> + <ngram occurrences="12" value="ne" /> + <ngram occurrences="12" value="ma" /> + <ngram occurrences="12" value="ing" /> + <ngram occurrences="12" value="ent_" /> + <ngram occurrences="12" value="e_p" /> + <ngram occurrences="12" value="di" /> + <ngram occurrences="12" value="ch" /> + <ngram occurrences="12" value="ad" /> + <ngram occurrences="12" value="_n" /> + <ngram occurrences="11" value="wh" /> + <ngram occurrences="11" value="us" /> + <ngram occurrences="11" value="si" /> + <ngram occurrences="11" value="res" /> + <ngram occurrences="11" value="ons" /> + <ngram occurrences="11" value="is_" /> + <ngram occurrences="11" value="ing_" /> + <ngram occurrences="11" value="es_a" /> + <ngram occurrences="11" value="e_i" /> + <ngram occurrences="11" value="art" /> + <ngram occurrences="11" value="_wh" /> + <ngram occurrences="11" value="_pr" /> + <ngram occurrences="11" value="_be" /> + <ngram occurrences="10" value="tr" /> + <ngram occurrences="10" value="rs" /> + <ngram occurrences="10" value="part" /> + <ngram occurrences="10" value="par" /> + <ngram occurrences="10" value="ov" /> + <ngram occurrences="10" value="nf" /> + <ngram occurrences="10" value="na" /> + <ngram occurrences="10" value="n_the" /> + <ngram occurrences="10" value="ll" /> + <ngram occurrences="10" value="it_" /> + <ngram occurrences="10" value="in_th" /> + <ngram occurrences="10" value="in_t" /> + <ngram occurrences="10" value="hat" /> + <ngram occurrences="10" value="go" /> + <ngram occurrences="10" value="ess" /> + <ngram occurrences="10" value="ere" /> + <ngram occurrences="10" value="ati" /> + <ngram occurrences="10" value="_it" /> + <ngram occurrences="10" value="_ha" /> + <ngram occurrences="9" value="wi" /> + <ngram occurrences="9" value="ue" /> + <ngram occurrences="9" value="thi" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="se_" /> + <ngram occurrences="9" value="s_the" /> + <ngram occurrences="9" value="ove" /> + <ngram occurrences="9" value="ni" /> + <ngram occurrences="9" value="ies_" /> + <ngram occurrences="9" value="ies" /> + <ngram occurrences="9" value="her" /> + <ngram occurrences="9" value="fo" /> + <ngram occurrences="9" value="et" /> + <ngram occurrences="9" value="e_th" /> + <ngram occurrences="9" value="e_f" /> + <ngram occurrences="9" value="der" /> + <ngram occurrences="9" value="d_th" /> + <ngram occurrences="9" value="d_a" /> + <ngram occurrences="9" value="by_" /> + <ngram occurrences="9" value="by" /> + <ngram occurrences="9" value="ab" /> + <ngram occurrences="9" value="_wi" /> + <ngram occurrences="9" value="_we" /> + <ngram occurrences="9" value="_un" /> + <ngram occurrences="9" value="_u" /> + <ngram occurrences="9" value="_pa" /> + <ngram occurrences="9" value="_ma" /> + <ngram occurrences="9" value="_by_" /> + <ngram occurrences="9" value="_by" /> + <ngram occurrences="9" value="_as" /> + <ngram occurrences="8" value="to_t" /> + <ngram occurrences="8" value="tha" /> + <ngram occurrences="8" value="t_t" /> + <ngram occurrences="8" value="st_" /> + <ngram occurrences="8" value="rn" /> + <ngram occurrences="8" value="pro" /> + <ngram occurrences="8" value="over" /> + <ngram occurrences="8" value="op" /> + <ngram occurrences="8" value="ons_" /> + <ngram occurrences="8" value="o_t" /> + <ngram occurrences="8" value="n_o" /> + <ngram occurrences="8" value="n_i" /> + <ngram occurrences="8" value="ment_" /> + <ngram occurrences="8" value="ll_" /> + <ngram occurrences="8" value="le_" /> + <ngram occurrences="8" value="iv" /> + <ngram occurrences="8" value="ir" /> + <ngram occurrences="8" value="her_" /> + <ngram occurrences="8" value="hat_" /> + <ngram occurrences="8" value="h_" /> + <ngram occurrences="8" value="ern" /> + <ngram occurrences="8" value="ei" /> + <ngram occurrences="8" value="ee" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="e_in" /> + <ngram occurrences="8" value="con" /> + <ngram occurrences="8" value="ce_" /> + <ngram occurrences="8" value="bl" /> + <ngram occurrences="8" value="be_" /> + <ngram occurrences="8" value="av" /> + <ngram occurrences="8" value="ation" /> + <ngram occurrences="8" value="atio" /> + <ngram occurrences="8" value="as_" /> + <ngram occurrences="8" value="am" /> + <ngram occurrences="8" value="_v" /> + <ngram occurrences="8" value="_tha" /> + <ngram occurrences="8" value="_pro" /> + <ngram occurrences="8" value="_l" /> + <ngram occurrences="8" value="_it_" /> + <ngram occurrences="8" value="_go" /> + <ngram occurrences="8" value="_con" /> + <ngram occurrences="8" value="_at" /> + <ngram occurrences="8" value="_as_" /> + <ngram occurrences="7" value="y_o" /> + <ngram occurrences="7" value="y_a" /> + <ngram occurrences="7" value="vernm" /> + <ngram occurrences="7" value="vern" /> + <ngram occurrences="7" value="ur" /> + <ngram occurrences="7" value="to_th" /> + <ngram occurrences="7" value="that_" /> + <ngram occurrences="7" value="that" /> + <ngram occurrences="7" value="so" /> + <ngram occurrences="7" value="sion" /> + <ngram occurrences="7" value="sio" /> + <ngram occurrences="7" value="rs_" /> + <ngram occurrences="7" value="rnmen" /> + <ngram occurrences="7" value="rnme" /> + <ngram occurrences="7" value="rnm" /> + <ngram occurrences="7" value="rea" /> + <ngram occurrences="7" value="per" /> + <ngram occurrences="7" value="overn" /> + <ngram occurrences="7" value="ot" /> + <ngram occurrences="7" value="os" /> + <ngram occurrences="7" value="on_o" /> + <ngram occurrences="7" value="on_i" /> + <ngram occurrences="7" value="o_the" /> + <ngram occurrences="7" value="o_th" /> + <ngram occurrences="7" value="nts_" /> + <ngram occurrences="7" value="nts" /> + <ngram occurrences="7" value="nment" /> + <ngram occurrences="7" value="nmen" /> + <ngram occurrences="7" value="nme" /> + <ngram occurrences="7" value="nm" /> + <ngram occurrences="7" value="n_a" /> + <ngram occurrences="7" value="mp" /> + <ngram occurrences="7" value="mo" /> + <ngram occurrences="7" value="k" /> + <ngram occurrences="7" value="j" /> + <ngram occurrences="7" value="ive" /> + <ngram occurrences="7" value="ion_o" /> + <ngram occurrences="7" value="ion_i" /> + <ngram occurrences="7" value="hic" /> + <ngram occurrences="7" value="hav" /> + <ngram occurrences="7" value="gover" /> + <ngram occurrences="7" value="gove" /> + <ngram occurrences="7" value="gov" /> + <ngram occurrences="7" value="for" /> + <ngram occurrences="7" value="fl" /> + <ngram occurrences="7" value="fe" /> + <ngram occurrences="7" value="ers" /> + <ngram occurrences="7" value="ernme" /> + <ngram occurrences="7" value="ernm" /> + <ngram occurrences="7" value="era" /> + <ngram occurrences="7" value="ens" /> + <ngram occurrences="7" value="en_" /> + <ngram occurrences="7" value="eas" /> + <ngram occurrences="7" value="e_the" /> + <ngram occurrences="7" value="d_b" /> + <ngram occurrences="7" value="cti" /> + <ngram occurrences="7" value="cr" /> + <ngram occurrences="7" value="ch_" /> + <ngram occurrences="7" value="al_" /> + <ngram occurrences="7" value="_to_t" /> + <ngram occurrences="7" value="_that" /> + <ngram occurrences="7" value="_on" /> + <ngram occurrences="7" value="_me" /> + <ngram occurrences="7" value="_le" /> + <ngram occurrences="7" value="_in_t" /> + <ngram occurrences="7" value="_hav" /> + <ngram occurrences="7" value="_gove" /> + <ngram occurrences="7" value="_gov" /> + <ngram occurrences="7" value="_fo" /> + <ngram occurrences="7" value="_be_" /> + <ngram occurrences="6" value="y_i" /> + <ngram occurrences="6" value="x" /> + <ngram occurrences="6" value="whi" /> + <ngram occurrences="6" value="vi" /> + <ngram occurrences="6" value="va" /> + <ngram occurrences="6" value="ut" /> + <ngram occurrences="6" value="uni" /> + <ngram occurrences="6" value="uen" /> + <ngram occurrences="6" value="ub" /> + <ngram occurrences="6" value="tu" /> + <ngram occurrences="6" value="ts_t" /> + <ngram occurrences="6" value="ties_" /> + <ngram occurrences="6" value="ties" /> + <ngram occurrences="6" value="tie" /> + <ngram occurrences="6" value="the_s" /> + <ngram occurrences="6" value="the_p" /> + <ngram occurrences="6" value="the_m" /> + <ngram occurrences="6" value="the_i" /> + <ngram occurrences="6" value="the_a" /> + <ngram occurrences="6" value="ted_" /> + <ngram occurrences="6" value="ted" /> + <ngram occurrences="6" value="t_w" /> + <ngram occurrences="6" value="t_i" /> + <ngram occurrences="6" value="str" /> + <ngram occurrences="6" value="sp" /> + <ngram occurrences="6" value="sed_" /> + <ngram occurrences="6" value="sed" /> + <ngram occurrences="6" value="s_w" /> + <ngram occurrences="6" value="r_i" /> + <ngram occurrences="6" value="or_" /> + <ngram occurrences="6" value="on_of" /> + <ngram occurrences="6" value="om" /> + <ngram occurrences="6" value="ng_t" /> + <ngram occurrences="6" value="nfl" /> + <ngram occurrences="6" value="nce" /> + <ngram occurrences="6" value="n_w" /> + <ngram occurrences="6" value="n_of_" /> +</ngrams> diff --git a/src/plugins/language/esperanto.klp b/src/plugins/language/esperanto.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="791" value="_" /> + <ngram occurrences="479" value="a" /> + <ngram occurrences="374" value="i" /> + <ngram occurrences="345" value="o" /> + <ngram occurrences="334" value="e" /> + <ngram occurrences="313" value="n" /> + <ngram occurrences="233" value="s" /> + <ngram occurrences="230" value="l" /> + <ngram occurrences="201" value="r" /> + <ngram occurrences="189" value="t" /> + <ngram occurrences="140" value="k" /> + <ngram occurrences="116" value="p" /> + <ngram occurrences="115" value="u" /> + <ngram occurrences="115" value="j" /> + <ngram occurrences="111" value="a_" /> + <ngram occurrences="109" value="o_" /> + <ngram occurrences="108" value="m" /> + <ngram occurrences="106" value="n_" /> + <ngram occurrences="102" value="d" /> + <ngram occurrences="100" value="s_" /> + <ngram occurrences="88" value="e_" /> + <ngram occurrences="86" value="la" /> + <ngram occurrences="79" value="_k" /> + <ngram occurrences="78" value="_l" /> + <ngram occurrences="77" value="i_" /> + <ngram occurrences="71" value="j_" /> + <ngram occurrences="67" value="_p" /> + <ngram occurrences="66" value="g" /> + <ngram occurrences="64" value="v" /> + <ngram occurrences="64" value="on" /> + <ngram occurrences="62" value="la_" /> + <ngram occurrences="62" value="an" /> + <ngram occurrences="58" value="_s" /> + <ngram occurrences="58" value="_n" /> + <ngram occurrences="58" value="_la" /> + <ngram occurrences="56" value="aj" /> + <ngram occurrences="55" value="as" /> + <ngram occurrences="55" value="_a" /> + <ngram occurrences="54" value="en" /> + <ngram occurrences="54" value="_e" /> + <ngram occurrences="52" value="c" /> + <ngram occurrences="52" value="_la_" /> + <ngram occurrences="51" value="ta" /> + <ngram occurrences="50" value="al" /> + <ngram occurrences="47" value="as_" /> + <ngram occurrences="47" value="_t" /> + <ngram occurrences="45" value="b" /> + <ngram occurrences="45" value="_m" /> + <ngram occurrences="44" value="is" /> + <ngram occurrences="42" value="ti" /> + <ngram occurrences="42" value="f" /> + <ngram occurrences="42" value="_d" /> + <ngram occurrences="41" value="ra" /> + <ngram occurrences="40" value="on_" /> + <ngram occurrences="39" value="ro" /> + <ngram occurrences="39" value="aj_" /> + <ngram occurrences="38" value="is_" /> + <ngram occurrences="37" value="ka" /> + <ngram occurrences="36" value="de" /> + <ngram occurrences="35" value="st" /> + <ngram occurrences="35" value="ne" /> + <ngram occurrences="35" value="er" /> + <ngram occurrences="34" value="ri" /> + <ngram occurrences="33" value="oj" /> + <ngram occurrences="33" value="io" /> + <ngram occurrences="33" value="ia" /> + <ngram occurrences="32" value="or" /> + <ngram occurrences="31" value="ø" /> + <ngram occurrences="31" value="es" /> + <ngram occurrences="30" value="te" /> + <ngram occurrences="30" value="ni" /> + <ngram occurrences="30" value="mi" /> + <ngram occurrences="30" value="ma" /> + <ngram occurrences="30" value="li" /> + <ngram occurrences="28" value="æ" /> + <ngram occurrences="28" value="to" /> + <ngram occurrences="28" value="re" /> + <ngram occurrences="28" value="pr" /> + <ngram occurrences="28" value="ko" /> + <ngram occurrences="28" value="_ne" /> + <ngram occurrences="27" value="si" /> + <ngram occurrences="27" value="oj_" /> + <ngram occurrences="27" value="no" /> + <ngram occurrences="27" value="lo" /> + <ngram occurrences="27" value="el" /> + <ngram occurrences="26" value="in" /> + <ngram occurrences="26" value="_ka" /> + <ngram occurrences="26" value="_i" /> + <ngram occurrences="25" value="x" /> + <ngram occurrences="25" value="l_" /> + <ngram occurrences="25" value="_ti" /> + <ngram occurrences="24" value="vi" /> + <ngram occurrences="24" value="nt" /> + <ngram occurrences="24" value="ci" /> + <ngram occurrences="24" value="_pr" /> + <ngram occurrences="24" value="_de" /> + <ngram occurrences="23" value="na" /> + <ngram occurrences="23" value="ig" /> + <ngram occurrences="22" value="u_" /> + <ngram occurrences="22" value="po" /> + <ngram occurrences="22" value="ar" /> + <ngram occurrences="22" value="an_" /> + <ngram occurrences="22" value="_v" /> + <ngram occurrences="21" value="ý" /> + <ngram occurrences="21" value="z" /> + <ngram occurrences="21" value="de_" /> + <ngram occurrences="21" value="aý" /> + <ngram occurrences="21" value="_r" /> + <ngram occurrences="21" value="_b" /> + <ngram occurrences="20" value="kaj_" /> + <ngram occurrences="20" value="kaj" /> + <ngram occurrences="20" value="jn" /> + <ngram occurrences="20" value="io_" /> + <ngram occurrences="20" value="h" /> + <ngram occurrences="20" value="_mi" /> + <ngram occurrences="20" value="_ma" /> + <ngram occurrences="19" value="un" /> + <ngram occurrences="19" value="sta" /> + <ngram occurrences="19" value="nd" /> + <ngram occurrences="19" value="mal" /> + <ngram occurrences="19" value="est" /> + <ngram occurrences="19" value="_de_" /> + <ngram occurrences="18" value="ne_" /> + <ngram occurrences="18" value="le" /> + <ngram occurrences="18" value="il" /> + <ngram occurrences="18" value="at" /> + <ngram occurrences="18" value="_æ" /> + <ngram occurrences="18" value="_mal" /> + <ngram occurrences="18" value="_kaj_" /> + <ngram occurrences="18" value="_kaj" /> + <ngram occurrences="18" value="_al" /> + <ngram occurrences="17" value="se" /> + <ngram occurrences="17" value="pa" /> + <ngram occurrences="17" value="ov" /> + <ngram occurrences="17" value="o_d" /> + <ngram occurrences="17" value="do" /> + <ngram occurrences="17" value="di" /> + <ngram occurrences="17" value="_ne_" /> + <ngram occurrences="16" value="tr" /> + <ngram occurrences="16" value="tas" /> + <ngram occurrences="16" value="ro_" /> + <ngram occurrences="16" value="pe" /> + <ngram occurrences="16" value="om" /> + <ngram occurrences="16" value="am" /> + <ngram occurrences="16" value="_vi" /> + <ngram occurrences="16" value="_se" /> + <ngram occurrences="16" value="_o" /> + <ngram occurrences="16" value="_ko" /> + <ngram occurrences="16" value="_est" /> + <ngram occurrences="16" value="_es" /> + <ngram occurrences="15" value="va" /> + <ngram occurrences="15" value="tu" /> + <ngram occurrences="15" value="tas_" /> + <ngram occurrences="15" value="s_k" /> + <ngram occurrences="15" value="r_" /> + <ngram occurrences="15" value="ki" /> + <ngram occurrences="15" value="iu" /> + <ngram occurrences="15" value="gr" /> + <ngram occurrences="15" value="gi" /> + <ngram occurrences="15" value="en_" /> + <ngram occurrences="15" value="_h" /> + <ngram occurrences="15" value="_en" /> + <ngram occurrences="14" value="te_" /> + <ngram occurrences="14" value="pl" /> + <ngram occurrences="14" value="ol" /> + <ngram occurrences="14" value="n_l" /> + <ngram occurrences="14" value="id" /> + <ngram occurrences="14" value="ek" /> + <ngram occurrences="14" value="al_" /> + <ngram occurrences="14" value="a_k" /> + <ngram occurrences="14" value="_po" /> + <ngram occurrences="14" value="_ki" /> + <ngram occurrences="14" value="_g" /> + <ngram occurrences="14" value="_f" /> + <ngram occurrences="14" value="_al_" /> + <ngram occurrences="13" value="þ" /> + <ngram occurrences="13" value="ur" /> + <ngram occurrences="13" value="stas_" /> + <ngram occurrences="13" value="stas" /> + <ngram occurrences="13" value="pro" /> + <ngram occurrences="13" value="ok" /> + <ngram occurrences="13" value="o_k" /> + <ngram occurrences="13" value="mi_" /> + <ngram occurrences="13" value="jn_" /> + <ngram occurrences="13" value="ie" /> + <ngram occurrences="13" value="e_l" /> + <ngram occurrences="13" value="ajn" /> + <ngram occurrences="13" value="_en_" /> + <ngram occurrences="12" value="ý_" /> + <ngram occurrences="12" value="ve" /> + <ngram occurrences="12" value="to_" /> + <ngram occurrences="12" value="n_la" /> + <ngram occurrences="12" value="n_k" /> + <ngram occurrences="12" value="me" /> + <ngram occurrences="12" value="kt" /> + <ngram occurrences="12" value="im" /> + <ngram occurrences="12" value="esta" /> + <ngram occurrences="12" value="da" /> + <ngram occurrences="12" value="aý_" /> + <ngram occurrences="12" value="ag" /> + <ngram occurrences="12" value="_pro" /> + <ngram occurrences="12" value="_ni" /> + <ngram occurrences="11" value="tio" /> + <ngram occurrences="11" value="so" /> + <ngram occurrences="11" value="s_a" /> + <ngram occurrences="11" value="ran" /> + <ngram occurrences="11" value="os" /> + <ngram occurrences="11" value="o_p" /> + <ngram occurrences="11" value="o_de" /> + <ngram occurrences="11" value="n_p" /> + <ngram occurrences="11" value="lu" /> + <ngram occurrences="11" value="lo_" /> + <ngram occurrences="11" value="li_" /> + <ngram occurrences="11" value="ku" /> + <ngram occurrences="11" value="iø" /> + <ngram occurrences="11" value="it" /> + <ngram occurrences="11" value="ia_" /> + <ngram occurrences="11" value="ga" /> + <ngram occurrences="11" value="fo" /> + <ngram occurrences="11" value="estas" /> + <ngram occurrences="11" value="bo" /> + <ngram occurrences="11" value="ant" /> + <ngram occurrences="11" value="a_n" /> + <ngram occurrences="11" value="_tio" /> + <ngram occurrences="11" value="_pl" /> + <ngram occurrences="11" value="_pa" /> + <ngram occurrences="11" value="_no" /> + <ngram occurrences="11" value="_mi_" /> + <ngram occurrences="11" value="_j" /> + <ngram occurrences="10" value="øi" /> + <ngram occurrences="10" value="ta_" /> + <ngram occurrences="10" value="rt" /> + <ngram occurrences="10" value="pre" /> + <ngram occurrences="10" value="por" /> + <ngram occurrences="10" value="o_s" /> + <ngram occurrences="10" value="o_n" /> + <ngram occurrences="10" value="ni_" /> + <ngram occurrences="10" value="n_la_" /> + <ngram occurrences="10" value="mp" /> + <ngram occurrences="10" value="m_" /> + <ngram occurrences="10" value="ks" /> + <ngram occurrences="10" value="ke" /> + <ngram occurrences="10" value="ir" /> + <ngram occurrences="10" value="ik" /> + <ngram occurrences="10" value="i_p" /> + <ngram occurrences="10" value="fe" /> + <ngram occurrences="10" value="ec" /> + <ngram occurrences="10" value="e_e" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="ce" /> + <ngram occurrences="10" value="ab" /> + <ngram occurrences="10" value="_ø" /> + <ngram occurrences="10" value="_si" /> + <ngram occurrences="10" value="_li" /> + <ngram occurrences="10" value="_an" /> + <ngram occurrences="9" value="øo" /> + <ngram occurrences="9" value="æi" /> + <ngram occurrences="9" value="xi" /> + <ngram occurrences="9" value="ter" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="sa" /> + <ngram occurrences="9" value="res" /> + <ngram occurrences="9" value="op" /> + <ngram occurrences="9" value="on_k" /> + <ngram occurrences="9" value="o_e" /> + <ngram occurrences="9" value="o_de_" /> + <ngram occurrences="9" value="nte" /> + <ngram occurrences="9" value="nk" /> + <ngram occurrences="9" value="nc" /> + <ngram occurrences="9" value="n_n" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="la_k" /> + <ngram occurrences="9" value="kon" /> + <ngram occurrences="9" value="j_p" /> + <ngram occurrences="9" value="is_k" /> + <ngram occurrences="9" value="igi" /> + <ngram occurrences="9" value="i_k" /> + <ngram occurrences="9" value="ho" /> + <ngram occurrences="9" value="gx" /> + <ngram occurrences="9" value="gra" /> + <ngram occurrences="9" value="el_" /> + <ngram occurrences="9" value="ed" /> + <ngram occurrences="9" value="d_" /> + <ngram occurrences="9" value="a_t" /> + <ngram occurrences="9" value="a_p" /> + <ngram occurrences="9" value="_su" /> + <ngram occurrences="9" value="_re" /> + <ngram occurrences="9" value="_esta" /> + <ngram occurrences="8" value="un_" /> + <ngram occurrences="8" value="ul" /> + <ngram occurrences="8" value="tio_" /> + <ngram occurrences="8" value="ova" /> + <ngram occurrences="8" value="nov" /> + <ngram occurrences="8" value="no_" /> + <ngram occurrences="8" value="na_" /> + <ngram occurrences="8" value="n_t" /> + <ngram occurrences="8" value="men" /> + <ngram occurrences="8" value="jo" /> + <ngram occurrences="8" value="iaj_" /> + <ngram occurrences="8" value="iaj" /> + <ngram occurrences="8" value="i_a" /> + <ngram occurrences="8" value="em" /> + <ngram occurrences="8" value="ekt" /> + <ngram occurrences="8" value="e_la_" /> + <ngram occurrences="8" value="e_la" /> + <ngram occurrences="8" value="bl" /> + <ngram occurrences="8" value="ap" /> + <ngram occurrences="8" value="ac" /> + <ngram occurrences="8" value="a_s" /> + <ngram occurrences="8" value="_þ" /> + <ngram occurrences="8" value="_tio_" /> + <ngram occurrences="8" value="_pre" /> + <ngram occurrences="8" value="_por" /> + <ngram occurrences="8" value="_li_" /> + <ngram occurrences="8" value="_ke" /> + <ngram occurrences="8" value="_aý" /> + <ngram occurrences="7" value="øi_" /> + <ngram occurrences="7" value="øa" /> + <ngram occurrences="7" value="vo" /> + <ngram occurrences="7" value="ut" /> + <ngram occurrences="7" value="us" /> + <ngram occurrences="7" value="tra" /> + <ngram occurrences="7" value="sp" /> + <ngram occurrences="7" value="sim" /> + <ngram occurrences="7" value="sci" /> + <ngram occurrences="7" value="sc" /> + <ngram occurrences="7" value="s_m" /> + <ngram occurrences="7" value="s_la" /> + <ngram occurrences="7" value="s_l" /> + <ngram occurrences="7" value="s_e" /> + <ngram occurrences="7" value="s_al" /> + <ngram occurrences="7" value="rd" /> + <ngram occurrences="7" value="por_" /> + <ngram occurrences="7" value="per" /> + <ngram occurrences="7" value="or_" /> + <ngram occurrences="7" value="o_l" /> + <ngram occurrences="7" value="o_ka" /> + <ngram occurrences="7" value="nta" /> + <ngram occurrences="7" value="kom" /> + <ngram occurrences="7" value="ke_" /> + <ngram occurrences="7" value="j_a" /> + <ngram occurrences="7" value="ion_" /> + <ngram occurrences="7" value="ion" /> + <ngram occurrences="7" value="in_" /> + <ngram occurrences="7" value="iel_" /> + <ngram occurrences="7" value="iel" /> + <ngram occurrences="7" value="ide" /> + <ngram occurrences="7" value="ian_" /> + <ngram occurrences="7" value="ian" /> + <ngram occurrences="7" value="i_s" /> + <ngram occurrences="7" value="for" /> + <ngram occurrences="7" value="ev" /> + <ngram occurrences="7" value="et" /> + <ngram occurrences="7" value="enc" /> + <ngram occurrences="7" value="e_t" /> + <ngram occurrences="7" value="do_" /> + <ngram occurrences="7" value="cio" /> + <ngram occurrences="7" value="as_a" /> + <ngram occurrences="7" value="anta" /> + <ngram occurrences="7" value="ank" /> + <ngram occurrences="7" value="ala" /> + <ngram occurrences="7" value="aci" /> + <ngram occurrences="7" value="_øi" /> + <ngram occurrences="7" value="_æi" /> + <ngram occurrences="7" value="_por_" /> + <ngram occurrences="7" value="_ku" /> + <ngram occurrences="7" value="_ke_" /> + <ngram occurrences="7" value="_in" /> + <ngram occurrences="7" value="_ho" /> + <ngram occurrences="7" value="_for" /> + <ngram occurrences="7" value="_fo" /> + <ngram occurrences="6" value="øas_" /> + <ngram occurrences="6" value="øas" /> + <ngram occurrences="6" value="zo" /> + <ngram occurrences="6" value="vid" /> + <ngram occurrences="6" value="vi_" /> + <ngram occurrences="6" value="u_a" /> + <ngram occurrences="6" value="tie" /> + <ngram occurrences="6" value="ti_" /> + <ngram occurrences="6" value="s_la_" /> + <ngram occurrences="6" value="rn" /> + <ngram occurrences="6" value="rm" /> + <ngram occurrences="6" value="rig" /> + <ngram occurrences="6" value="ren" /> + <ngram occurrences="6" value="os_" /> + <ngram occurrences="6" value="ort" /> + <ngram occurrences="6" value="oksi" /> + <ngram occurrences="6" value="oks" /> + <ngram occurrences="6" value="ojn_" /> + <ngram occurrences="6" value="ojn" /> + <ngram occurrences="6" value="of" /> + <ngram occurrences="6" value="o_ne" /> + <ngram occurrences="6" value="o_la_" /> + <ngram occurrences="6" value="o_la" /> + <ngram occurrences="6" value="nu" /> + <ngram occurrences="6" value="nis_" /> + <ngram occurrences="6" value="nis" /> + <ngram occurrences="6" value="lan" /> + <ngram occurrences="6" value="la_s" /> + <ngram occurrences="6" value="la_n" /> +</ngrams> diff --git a/src/plugins/language/estonian.klp b/src/plugins/language/estonian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="744" value="_" /> + <ngram occurrences="537" value="a" /> + <ngram occurrences="436" value="e" /> + <ngram occurrences="385" value="i" /> + <ngram occurrences="330" value="s" /> + <ngram occurrences="275" value="t" /> + <ngram occurrences="255" value="u" /> + <ngram occurrences="242" value="l" /> + <ngram occurrences="211" value="k" /> + <ngram occurrences="200" value="n" /> + <ngram occurrences="181" value="m" /> + <ngram occurrences="173" value="a_" /> + <ngram occurrences="163" value="d" /> + <ngram occurrences="127" value="o" /> + <ngram occurrences="117" value="e_" /> + <ngram occurrences="111" value="r" /> + <ngram occurrences="95" value="_k" /> + <ngram occurrences="94" value="s_" /> + <ngram occurrences="92" value="i_" /> + <ngram occurrences="91" value="v" /> + <ngram occurrences="84" value="h" /> + <ngram occurrences="80" value="g" /> + <ngram occurrences="78" value="p" /> + <ngram occurrences="76" value="d_" /> + <ngram occurrences="73" value="j" /> + <ngram occurrences="72" value="_t" /> + <ngram occurrences="69" value="_m" /> + <ngram occurrences="68" value="se" /> + <ngram occurrences="66" value="ma" /> + <ngram occurrences="65" value="is" /> + <ngram occurrences="64" value="t_" /> + <ngram occurrences="64" value="in" /> + <ngram occurrences="63" value="_s" /> + <ngram occurrences="62" value="ô" /> + <ngram occurrences="62" value="ä" /> + <ngram occurrences="62" value="ta" /> + <ngram occurrences="62" value="as" /> + <ngram occurrences="60" value="st" /> + <ngram occurrences="56" value="te" /> + <ngram occurrences="55" value="_p" /> + <ngram occurrences="53" value="le" /> + <ngram occurrences="52" value="_j" /> + <ngram occurrences="51" value="_v" /> + <ngram occurrences="50" value="si" /> + <ngram occurrences="46" value="ku" /> + <ngram occurrences="46" value="el" /> + <ngram occurrences="46" value="al" /> + <ngram occurrences="46" value="_o" /> + <ngram occurrences="45" value="ja" /> + <ngram occurrences="43" value="va" /> + <ngram occurrences="43" value="es" /> + <ngram occurrences="42" value="li" /> + <ngram occurrences="42" value="_e" /> + <ngram occurrences="41" value="id" /> + <ngram occurrences="40" value="_a" /> + <ngram occurrences="39" value="us" /> + <ngram occurrences="39" value="ud" /> + <ngram occurrences="39" value="ei" /> + <ngram occurrences="39" value="da" /> + <ngram occurrences="38" value="mi" /> + <ngram occurrences="36" value="ü" /> + <ngram occurrences="35" value="ol" /> + <ngram occurrences="35" value="nu" /> + <ngram occurrences="35" value="_n" /> + <ngram occurrences="33" value="u_" /> + <ngram occurrences="33" value="tu" /> + <ngram occurrences="33" value="ka" /> + <ngram occurrences="33" value="ja_" /> + <ngram occurrences="33" value="_ja" /> + <ngram occurrences="31" value="me" /> + <ngram occurrences="31" value="ga" /> + <ngram occurrences="30" value="na" /> + <ngram occurrences="30" value="b" /> + <ngram occurrences="29" value="n_" /> + <ngram occurrences="29" value="em" /> + <ngram occurrences="28" value="st_" /> + <ngram occurrences="28" value="_se" /> + <ngram occurrences="27" value="uu" /> + <ngram occurrences="27" value="ud_" /> + <ngram occurrences="27" value="ra" /> + <ngram occurrences="27" value="l_" /> + <ngram occurrences="27" value="at" /> + <ngram occurrences="26" value="ul" /> + <ngram occurrences="26" value="ma_" /> + <ngram occurrences="26" value="ik" /> + <ngram occurrences="26" value="et" /> + <ngram occurrences="26" value="an" /> + <ngram occurrences="25" value="ne" /> + <ngram occurrences="25" value="ks" /> + <ngram occurrences="25" value="ee" /> + <ngram occurrences="25" value="de" /> + <ngram occurrences="25" value="aa" /> + <ngram occurrences="25" value="a_k" /> + <ngram occurrences="25" value="_ta" /> + <ngram occurrences="25" value="_ja_" /> + <ngram occurrences="25" value="_h" /> + <ngram occurrences="24" value="nud" /> + <ngram occurrences="24" value="_ku" /> + <ngram occurrences="23" value="nud_" /> + <ngram occurrences="23" value="he" /> + <ngram occurrences="23" value="ga_" /> + <ngram occurrences="23" value="as_" /> + <ngram occurrences="23" value="ag" /> + <ngram occurrences="22" value="ni" /> + <ngram occurrences="22" value="le_" /> + <ngram occurrences="22" value="ko" /> + <ngram occurrences="22" value="id_" /> + <ngram occurrences="22" value="am" /> + <ngram occurrences="22" value="_l" /> + <ngram occurrences="21" value="ôi" /> + <ngram occurrences="21" value="är" /> + <ngram occurrences="21" value="te_" /> + <ngram occurrences="21" value="ll" /> + <ngram occurrences="21" value="ke" /> + <ngram occurrences="21" value="_va" /> + <ngram occurrences="21" value="_te" /> + <ngram occurrences="21" value="_mi" /> + <ngram occurrences="20" value="nd" /> + <ngram occurrences="20" value="ii" /> + <ngram occurrences="20" value="ad" /> + <ngram occurrences="20" value="_r" /> + <ngram occurrences="19" value="vô" /> + <ngram occurrences="19" value="sa" /> + <ngram occurrences="19" value="is_" /> + <ngram occurrences="19" value="es_" /> + <ngram occurrences="19" value="a_t" /> + <ngram occurrences="19" value="_vô" /> + <ngram occurrences="18" value="ks_" /> + <ngram occurrences="18" value="ju" /> + <ngram occurrences="18" value="ha" /> + <ngram occurrences="18" value="en" /> + <ngram occurrences="18" value="ast" /> + <ngram occurrences="18" value="ak" /> + <ngram occurrences="18" value="_ol" /> + <ngram occurrences="17" value="ut" /> + <ngram occurrences="17" value="ta_" /> + <ngram occurrences="17" value="pa" /> + <ngram occurrences="17" value="ise" /> + <ngram occurrences="17" value="il" /> + <ngram occurrences="17" value="gi" /> + <ngram occurrences="17" value="eg" /> + <ngram occurrences="17" value="ar" /> + <ngram occurrences="17" value="_si" /> + <ngram occurrences="17" value="_ko" /> + <ngram occurrences="17" value="_ka" /> + <ngram occurrences="16" value="sin" /> + <ngram occurrences="16" value="ne_" /> + <ngram occurrences="16" value="it" /> + <ngram occurrences="16" value="in_" /> + <ngram occurrences="16" value="ed" /> + <ngram occurrences="16" value="ah" /> + <ngram occurrences="16" value="_ma" /> + <ngram occurrences="15" value="ö" /> + <ngram occurrences="15" value="vi" /> + <ngram occurrences="15" value="un" /> + <ngram occurrences="15" value="ui" /> + <ngram occurrences="15" value="sel" /> + <ngram occurrences="15" value="se_" /> + <ngram occurrences="15" value="re" /> + <ngram occurrences="15" value="po" /> + <ngram occurrences="15" value="oo" /> + <ngram occurrences="15" value="ki" /> + <ngram occurrences="15" value="e_k" /> + <ngram occurrences="15" value="da_" /> + <ngram occurrences="15" value="d_j" /> + <ngram occurrences="15" value="a_p" /> + <ngram occurrences="15" value="_i" /> + <ngram occurrences="14" value="vôi" /> + <ngram occurrences="14" value="ts" /> + <ngram occurrences="14" value="su" /> + <ngram occurrences="14" value="ri" /> + <ngram occurrences="14" value="oli" /> + <ngram occurrences="14" value="min" /> + <ngram occurrences="14" value="li_" /> + <ngram occurrences="14" value="la" /> + <ngram occurrences="14" value="kui" /> + <ngram occurrences="14" value="gu" /> + <ngram occurrences="14" value="e_v" /> + <ngram occurrences="14" value="ai" /> + <ngram occurrences="14" value="_vôi" /> + <ngram occurrences="13" value="ust" /> + <ngram occurrences="13" value="oh" /> + <ngram occurrences="13" value="na_" /> + <ngram occurrences="13" value="lu" /> + <ngram occurrences="13" value="lt" /> + <ngram occurrences="13" value="im" /> + <ngram occurrences="13" value="i_t" /> + <ngram occurrences="13" value="gi_" /> + <ngram occurrences="13" value="est" /> + <ngram occurrences="13" value="er" /> + <ngram occurrences="13" value="ei_" /> + <ngram occurrences="13" value="asi" /> + <ngram occurrences="13" value="aga" /> + <ngram occurrences="13" value="a_e" /> + <ngram occurrences="13" value="_ä" /> + <ngram occurrences="13" value="_pa" /> + <ngram occurrences="13" value="_kui" /> + <ngram occurrences="13" value="_ei_" /> + <ngram occurrences="13" value="_ei" /> + <ngram occurrences="12" value="ära" /> + <ngram occurrences="12" value="us_" /> + <ngram occurrences="12" value="sta" /> + <ngram occurrences="12" value="ole" /> + <ngram occurrences="12" value="lt_" /> + <ngram occurrences="12" value="kk" /> + <ngram occurrences="12" value="ist" /> + <ngram occurrences="12" value="ine" /> + <ngram occurrences="12" value="i_s" /> + <ngram occurrences="12" value="ge" /> + <ngram occurrences="12" value="ema" /> + <ngram occurrences="12" value="ele" /> + <ngram occurrences="12" value="eh" /> + <ngram occurrences="12" value="e_m" /> + <ngram occurrences="12" value="av" /> + <ngram occurrences="12" value="a_m" /> + <ngram occurrences="12" value="_tu" /> + <ngram occurrences="12" value="_po" /> + <ngram occurrences="11" value="tt" /> + <ngram occurrences="11" value="tas" /> + <ngram occurrences="11" value="s_t" /> + <ngram occurrences="11" value="s_s" /> + <ngram occurrences="11" value="s_m" /> + <ngram occurrences="11" value="or" /> + <ngram occurrences="11" value="mis" /> + <ngram occurrences="11" value="me_" /> + <ngram occurrences="11" value="lle" /> + <ngram occurrences="11" value="les" /> + <ngram occurrences="11" value="ida" /> + <ngram occurrences="11" value="hel" /> + <ngram occurrences="11" value="et_" /> + <ngram occurrences="11" value="ek" /> + <ngram occurrences="11" value="a_o" /> + <ngram occurrences="11" value="a_a" /> + <ngram occurrences="11" value="_oli" /> + <ngram occurrences="11" value="_me" /> + <ngram occurrences="10" value="u_k" /> + <ngram occurrences="10" value="ste" /> + <ngram occurrences="10" value="sin_" /> + <ngram occurrences="10" value="s_k" /> + <ngram occurrences="10" value="pu" /> + <ngram occurrences="10" value="pi" /> + <ngram occurrences="10" value="ot" /> + <ngram occurrences="10" value="on" /> + <ngram occurrences="10" value="ng" /> + <ngram occurrences="10" value="mu" /> + <ngram occurrences="10" value="lis" /> + <ngram occurrences="10" value="kuu" /> + <ngram occurrences="10" value="inu" /> + <ngram occurrences="10" value="ine_" /> + <ngram occurrences="10" value="ina" /> + <ngram occurrences="10" value="hk" /> + <ngram occurrences="10" value="gu_" /> + <ngram occurrences="10" value="eis" /> + <ngram occurrences="10" value="e_s" /> + <ngram occurrences="10" value="e_p" /> + <ngram occurrences="10" value="d_k" /> + <ngram occurrences="10" value="ava" /> + <ngram occurrences="10" value="aks" /> + <ngram occurrences="10" value="aj" /> + <ngram occurrences="10" value="aga_" /> + <ngram occurrences="10" value="ad_" /> + <ngram occurrences="10" value="a_v" /> + <ngram occurrences="10" value="a_h" /> + <ngram occurrences="10" value="_ü" /> + <ngram occurrences="10" value="_ta_" /> + <ngram occurrences="10" value="_sel" /> + <ngram occurrences="10" value="_ni" /> + <ngram occurrences="10" value="_ju" /> + <ngram occurrences="10" value="_et" /> + <ngram occurrences="9" value="ôt" /> + <ngram occurrences="9" value="ää" /> + <ngram occurrences="9" value="um" /> + <ngram occurrences="9" value="ui_" /> + <ngram occurrences="9" value="tei" /> + <ngram occurrences="9" value="t_k" /> + <ngram occurrences="9" value="s_o" /> + <ngram occurrences="9" value="on_" /> + <ngram occurrences="9" value="oma" /> + <ngram occurrences="9" value="om" /> + <ngram occurrences="9" value="nn" /> + <ngram occurrences="9" value="m_" /> + <ngram occurrences="9" value="kui_" /> + <ngram occurrences="9" value="ka_" /> + <ngram occurrences="9" value="ia" /> + <ngram occurrences="9" value="i_v" /> + <ngram occurrences="9" value="i_m" /> + <ngram occurrences="9" value="hi" /> + <ngram occurrences="9" value="est_" /> + <ngram occurrences="9" value="ell" /> + <ngram occurrences="9" value="el_" /> + <ngram occurrences="9" value="ea" /> + <ngram occurrences="9" value="di" /> + <ngram occurrences="9" value="de_" /> + <ngram occurrences="9" value="d_a" /> + <ngram occurrences="9" value="ast_" /> + <ngram occurrences="9" value="a_s" /> + <ngram occurrences="9" value="a_ku" /> + <ngram occurrences="9" value="_on_" /> + <ngram occurrences="9" value="_on" /> + <ngram occurrences="9" value="_oma" /> + <ngram occurrences="9" value="_om" /> + <ngram occurrences="9" value="_kuu" /> + <ngram occurrences="9" value="_he" /> + <ngram occurrences="9" value="_aga_" /> + <ngram occurrences="9" value="_aga" /> + <ngram occurrences="9" value="_ag" /> + <ngram occurrences="8" value="üü" /> + <ngram occurrences="8" value="ül" /> + <ngram occurrences="8" value="äi" /> + <ngram occurrences="8" value="ve" /> + <ngram occurrences="8" value="uul" /> + <ngram occurrences="8" value="tte" /> + <ngram occurrences="8" value="tas_" /> + <ngram occurrences="8" value="rd" /> + <ngram occurrences="8" value="puu" /> + <ngram occurrences="8" value="pe" /> + <ngram occurrences="8" value="oli_" /> + <ngram occurrences="8" value="nii" /> + <ngram occurrences="8" value="lm" /> + <ngram occurrences="8" value="lg" /> + <ngram occurrences="8" value="ld" /> + <ngram occurrences="8" value="kü" /> + <ngram occurrences="8" value="kô" /> + <ngram occurrences="8" value="ki_" /> + <ngram occurrences="8" value="kas" /> + <ngram occurrences="8" value="ja_k" /> + <ngram occurrences="8" value="ime" /> + <ngram occurrences="8" value="i_n" /> + <ngram occurrences="8" value="ev" /> + <ngram occurrences="8" value="ema_" /> + <ngram occurrences="8" value="elle" /> + <ngram occurrences="8" value="ega" /> + <ngram occurrences="8" value="d_m" /> + <ngram occurrences="8" value="b_" /> + <ngram occurrences="8" value="ami" /> + <ngram occurrences="8" value="ama" /> + <ngram occurrences="8" value="al_" /> + <ngram occurrences="8" value="ae" /> + <ngram occurrences="8" value="ab" /> + <ngram occurrences="8" value="a_l" /> + <ngram occurrences="8" value="_sa" /> + <ngram occurrences="8" value="_nii" /> + <ngram occurrences="8" value="_na" /> + <ngram occurrences="8" value="_mu" /> + <ngram occurrences="8" value="_kô" /> + <ngram occurrences="8" value="_kui_" /> + <ngram occurrences="8" value="_ke" /> + <ngram occurrences="8" value="_ha" /> + <ngram occurrences="8" value="_et_" /> + <ngram occurrences="7" value="üüd" /> + <ngram occurrences="7" value="üd" /> + <ngram occurrences="7" value="ôi_" /> + <ngram occurrences="7" value="vas" /> + <ngram occurrences="7" value="use" /> + <ngram occurrences="7" value="tus" /> + <ngram occurrences="7" value="tul" /> + <ngram occurrences="7" value="tte_" /> + <ngram occurrences="7" value="tl" /> + <ngram occurrences="7" value="t_o" /> + <ngram occurrences="7" value="selle" /> + <ngram occurrences="7" value="sell" /> + <ngram occurrences="7" value="see" /> + <ngram occurrences="7" value="s_p" /> + <ngram occurrences="7" value="roh" /> + <ngram occurrences="7" value="ro" /> + <ngram occurrences="7" value="rk" /> + <ngram occurrences="7" value="ra_" /> + <ngram occurrences="7" value="pol" /> + <ngram occurrences="7" value="nii_" /> + <ngram occurrences="7" value="nde" /> + <ngram occurrences="7" value="lä" /> + <ngram occurrences="7" value="kuul" /> + <ngram occurrences="7" value="ing" /> + <ngram occurrences="7" value="ina_" /> + <ngram occurrences="7" value="ika" /> + <ngram occurrences="7" value="ii_" /> + <ngram occurrences="7" value="hke" /> + <ngram occurrences="7" value="em_" /> + <ngram occurrences="7" value="ega_" /> + <ngram occurrences="7" value="e_va" /> + <ngram occurrences="7" value="e_t" /> + <ngram occurrences="7" value="e_se" /> + <ngram occurrences="7" value="e_r" /> + <ngram occurrences="7" value="du" /> + <ngram occurrences="7" value="d_ja" /> + <ngram occurrences="7" value="ba" /> + <ngram occurrences="7" value="ata" /> + <ngram occurrences="7" value="all" /> + <ngram occurrences="7" value="aks_" /> + <ngram occurrences="7" value="aja" /> + <ngram occurrences="7" value="a_j" /> + <ngram occurrences="7" value="_ô" /> + <ngram occurrences="7" value="_ära" /> + <ngram occurrences="7" value="_är" /> + <ngram occurrences="7" value="_ve" /> + <ngram occurrences="7" value="_tei" /> + <ngram occurrences="7" value="_sell" /> + <ngram occurrences="7" value="_roh" /> + <ngram occurrences="7" value="_ro" /> + <ngram occurrences="7" value="_pu" /> +</ngrams> diff --git a/src/plugins/language/finnish.klp b/src/plugins/language/finnish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="494" value="_" /> + <ngram occurrences="484" value="a" /> + <ngram occurrences="460" value="i" /> + <ngram occurrences="409" value="t" /> + <ngram occurrences="335" value="n" /> + <ngram occurrences="324" value="e" /> + <ngram occurrences="314" value="s" /> + <ngram occurrences="252" value="l" /> + <ngram occurrences="225" value="k" /> + <ngram occurrences="223" value="o" /> + <ngram occurrences="217" value="u" /> + <ngram occurrences="163" value="ä" /> + <ngram occurrences="159" value="n_" /> + <ngram occurrences="142" value="m" /> + <ngram occurrences="116" value="a_" /> + <ngram occurrences="108" value="v" /> + <ngram occurrences="85" value="h" /> + <ngram occurrences="82" value="y" /> + <ngram occurrences="80" value="ta" /> + <ngram occurrences="80" value="r" /> + <ngram occurrences="78" value="an" /> + <ngram occurrences="76" value="st" /> + <ngram occurrences="76" value="in" /> + <ngram occurrences="74" value="p" /> + <ngram occurrences="69" value="en" /> + <ngram occurrences="68" value="j" /> + <ngram occurrences="68" value="is" /> + <ngram occurrences="65" value="_k" /> + <ngram occurrences="60" value="it" /> + <ngram occurrences="55" value="si" /> + <ngram occurrences="55" value="aa" /> + <ngram occurrences="53" value="i_" /> + <ngram occurrences="52" value="ä_" /> + <ngram occurrences="52" value="tt" /> + <ngram occurrences="52" value="li" /> + <ngram occurrences="51" value="va" /> + <ngram occurrences="51" value="_t" /> + <ngram occurrences="50" value="ll" /> + <ngram occurrences="50" value="en_" /> + <ngram occurrences="49" value="mi" /> + <ngram occurrences="48" value="ka" /> + <ngram occurrences="47" value="se" /> + <ngram occurrences="45" value="te" /> + <ngram occurrences="45" value="an_" /> + <ngram occurrences="44" value="tä" /> + <ngram occurrences="43" value="tu" /> + <ngram occurrences="43" value="el" /> + <ngram occurrences="42" value="oi" /> + <ngram occurrences="42" value="ai" /> + <ngram occurrences="42" value="_o" /> + <ngram occurrences="41" value="_v" /> + <ngram occurrences="39" value="t_" /> + <ngram occurrences="39" value="ma" /> + <ngram occurrences="39" value="es" /> + <ngram occurrences="37" value="to" /> + <ngram occurrences="36" value="et" /> + <ngram occurrences="36" value="_s" /> + <ngram occurrences="35" value="d" /> + <ngram occurrences="35" value="_e" /> + <ngram occurrences="34" value="_p" /> + <ngram occurrences="33" value="ki" /> + <ngram occurrences="33" value="il" /> + <ngram occurrences="33" value="al" /> + <ngram occurrences="32" value="on" /> + <ngram occurrences="32" value="ol" /> + <ngram occurrences="31" value="us" /> + <ngram occurrences="31" value="la" /> + <ngram occurrences="31" value="e_" /> + <ngram occurrences="30" value="ku" /> + <ngram occurrences="30" value="ks" /> + <ngram occurrences="30" value="im" /> + <ngram occurrences="30" value="ik" /> + <ngram occurrences="30" value="_j" /> + <ngram occurrences="29" value="ta_" /> + <ngram occurrences="29" value="sa" /> + <ngram occurrences="29" value="ri" /> + <ngram occurrences="29" value="le" /> + <ngram occurrences="29" value="ja" /> + <ngram occurrences="29" value="in_" /> + <ngram occurrences="29" value="_m" /> + <ngram occurrences="29" value="_h" /> + <ngram occurrences="28" value="ti" /> + <ngram occurrences="28" value="ss" /> + <ngram occurrences="28" value="ke" /> + <ngram occurrences="28" value="at" /> + <ngram occurrences="27" value="uu" /> + <ngram occurrences="27" value="n_k" /> + <ngram occurrences="27" value="ko" /> + <ngram occurrences="26" value="nn" /> + <ngram occurrences="26" value="lu" /> + <ngram occurrences="26" value="ist" /> + <ngram occurrences="26" value="aan" /> + <ngram occurrences="25" value="sta" /> + <ngram occurrences="25" value="na" /> + <ngram occurrences="25" value="_va" /> + <ngram occurrences="24" value="ii" /> + <ngram occurrences="23" value="as" /> + <ngram occurrences="22" value="uo" /> + <ngram occurrences="22" value="tä_" /> + <ngram occurrences="21" value="ut" /> + <ngram occurrences="21" value="un" /> + <ngram occurrences="21" value="os" /> + <ngram occurrences="21" value="ne" /> + <ngram occurrences="21" value="ha" /> + <ngram occurrences="21" value="ei" /> + <ngram occurrences="21" value="aan_" /> + <ngram occurrences="20" value="ssa" /> + <ngram occurrences="20" value="nk" /> + <ngram occurrences="20" value="_l" /> + <ngram occurrences="19" value="on_" /> + <ngram occurrences="19" value="er" /> + <ngram occurrences="19" value="_a" /> + <ngram occurrences="18" value="vä" /> + <ngram occurrences="18" value="ty" /> + <ngram occurrences="18" value="tta" /> + <ngram occurrences="18" value="toi" /> + <ngram occurrences="18" value="sk" /> + <ngram occurrences="18" value="oim" /> + <ngram occurrences="18" value="n_t" /> + <ngram occurrences="18" value="me" /> + <ngram occurrences="18" value="ia" /> + <ngram occurrences="18" value="ar" /> + <ngram occurrences="18" value="ak" /> + <ngram occurrences="18" value="_ka" /> + <ngram occurrences="17" value="ö" /> + <ngram occurrences="17" value="ää" /> + <ngram occurrences="17" value="vi" /> + <ngram occurrences="17" value="sa_" /> + <ngram occurrences="17" value="nt" /> + <ngram occurrences="17" value="n_p" /> + <ngram occurrences="17" value="lä" /> + <ngram occurrences="17" value="ja_" /> + <ngram occurrences="17" value="ie" /> + <ngram occurrences="17" value="am" /> + <ngram occurrences="17" value="_to" /> + <ngram occurrences="16" value="yt" /> + <ngram occurrences="16" value="ul" /> + <ngram occurrences="16" value="su" /> + <ngram occurrences="16" value="sta_" /> + <ngram occurrences="16" value="ssa_" /> + <ngram occurrences="16" value="om" /> + <ngram occurrences="16" value="ni" /> + <ngram occurrences="16" value="n_v" /> + <ngram occurrences="16" value="lli" /> + <ngram occurrences="16" value="ksi" /> + <ngram occurrences="16" value="imi" /> + <ngram occurrences="16" value="de" /> + <ngram occurrences="15" value="toim" /> + <ngram occurrences="15" value="taa" /> + <ngram occurrences="15" value="ste" /> + <ngram occurrences="15" value="pa" /> + <ngram occurrences="15" value="oimi" /> + <ngram occurrences="15" value="min" /> + <ngram occurrences="15" value="ise" /> + <ngram occurrences="15" value="he" /> + <ngram occurrences="15" value="ett" /> + <ngram occurrences="15" value="ell" /> + <ngram occurrences="15" value="ee" /> + <ngram occurrences="15" value="ais" /> + <ngram occurrences="15" value="_on" /> + <ngram occurrences="15" value="_ol" /> + <ngram occurrences="15" value="_ko" /> + <ngram occurrences="15" value="_ja" /> + <ngram occurrences="15" value="_ha" /> + <ngram occurrences="14" value="toimi" /> + <ngram occurrences="14" value="lla" /> + <ngram occurrences="14" value="itt" /> + <ngram occurrences="14" value="est" /> + <ngram occurrences="14" value="all" /> + <ngram occurrences="14" value="aa_" /> + <ngram occurrences="14" value="a_o" /> + <ngram occurrences="14" value="a_k" /> + <ngram occurrences="14" value="_y" /> + <ngram occurrences="14" value="_n" /> + <ngram occurrences="13" value="vo" /> + <ngram occurrences="13" value="uk" /> + <ngram occurrences="13" value="sä" /> + <ngram occurrences="13" value="si_" /> + <ngram occurrences="13" value="pä" /> + <ngram occurrences="13" value="ok" /> + <ngram occurrences="13" value="lt" /> + <ngram occurrences="13" value="kse" /> + <ngram occurrences="13" value="kk" /> + <ngram occurrences="13" value="jo" /> + <ngram occurrences="13" value="je" /> + <ngram occurrences="13" value="em" /> + <ngram occurrences="13" value="au" /> + <ngram occurrences="13" value="at_" /> + <ngram occurrences="13" value="an_k" /> + <ngram occurrences="13" value="_toi" /> + <ngram occurrences="12" value="ts" /> + <ngram occurrences="12" value="sen" /> + <ngram occurrences="12" value="pi" /> + <ngram occurrences="12" value="ot" /> + <ngram occurrences="12" value="nki" /> + <ngram occurrences="12" value="n_s" /> + <ngram occurrences="12" value="le_" /> + <ngram occurrences="12" value="iv" /> + <ngram occurrences="12" value="iin" /> + <ngram occurrences="12" value="ht" /> + <ngram occurrences="12" value="_toim" /> + <ngram occurrences="12" value="_on_" /> + <ngram occurrences="12" value="_ke" /> + <ngram occurrences="12" value="_ja_" /> + <ngram occurrences="11" value="än" /> + <ngram occurrences="11" value="äl" /> + <ngram occurrences="11" value="äi" /> + <ngram occurrences="11" value="ust" /> + <ngram occurrences="11" value="up" /> + <ngram occurrences="11" value="tus" /> + <ngram occurrences="11" value="ttä" /> + <ngram occurrences="11" value="ten" /> + <ngram occurrences="11" value="s_" /> + <ngram occurrences="11" value="ole" /> + <ngram occurrences="11" value="nna" /> + <ngram occurrences="11" value="mu" /> + <ngram occurrences="11" value="mis" /> + <ngram occurrences="11" value="lle" /> + <ngram occurrences="11" value="lla_" /> + <ngram occurrences="11" value="lis" /> + <ngram occurrences="11" value="la_" /> + <ngram occurrences="11" value="ksi_" /> + <ngram occurrences="11" value="eri" /> + <ngram occurrences="11" value="av" /> + <ngram occurrences="11" value="ama" /> + <ngram occurrences="11" value="a_m" /> + <ngram occurrences="11" value="_tu" /> + <ngram occurrences="11" value="_ma" /> + <ngram occurrences="10" value="äv" /> + <ngram occurrences="10" value="ät" /> + <ngram occurrences="10" value="yy" /> + <ngram occurrences="10" value="yh" /> + <ngram occurrences="10" value="van" /> + <ngram occurrences="10" value="u_" /> + <ngram occurrences="10" value="oli" /> + <ngram occurrences="10" value="oit" /> + <ngram occurrences="10" value="nne" /> + <ngram occurrences="10" value="n_va" /> + <ngram occurrences="10" value="mm" /> + <ngram occurrences="10" value="lin" /> + <ngram occurrences="10" value="jä" /> + <ngram occurrences="10" value="ite" /> + <ngram occurrences="10" value="i_k" /> + <ngram occurrences="10" value="hal" /> + <ngram occurrences="10" value="ast" /> + <ngram occurrences="10" value="aj" /> + <ngram occurrences="10" value="ah" /> + <ngram occurrences="10" value="_ku" /> + <ngram occurrences="10" value="_jo" /> + <ngram occurrences="9" value="voi" /> + <ngram occurrences="9" value="uut" /> + <ngram occurrences="9" value="uks" /> + <ngram occurrences="9" value="stä" /> + <ngram occurrences="9" value="sti" /> + <ngram occurrences="9" value="ra" /> + <ngram occurrences="9" value="oj" /> + <ngram occurrences="9" value="nta" /> + <ngram occurrences="9" value="n_m" /> + <ngram occurrences="9" value="n_j" /> + <ngram occurrences="9" value="kau" /> + <ngram occurrences="9" value="io" /> + <ngram occurrences="9" value="iks" /> + <ngram occurrences="9" value="iin_" /> + <ngram occurrences="9" value="i_t" /> + <ngram occurrences="9" value="hu" /> + <ngram occurrences="9" value="hel" /> + <ngram occurrences="9" value="hd" /> + <ngram occurrences="9" value="g" /> + <ngram occurrences="9" value="et_" /> + <ngram occurrences="9" value="en_t" /> + <ngram occurrences="9" value="eh" /> + <ngram occurrences="9" value="alli" /> + <ngram occurrences="9" value="a_v" /> + <ngram occurrences="9" value="a_s" /> + <ngram occurrences="9" value="a_j" /> + <ngram occurrences="9" value="_ta" /> + <ngram occurrences="9" value="_su" /> + <ngram occurrences="9" value="_i" /> + <ngram occurrences="9" value="_et" /> + <ngram occurrences="8" value="är" /> + <ngram occurrences="8" value="ä_t" /> + <ngram occurrences="8" value="y_" /> + <ngram occurrences="8" value="vai" /> + <ngram occurrences="8" value="uv" /> + <ngram occurrences="8" value="ur" /> + <ngram occurrences="8" value="ulu" /> + <ngram occurrences="8" value="täv" /> + <ngram occurrences="8" value="ttaa" /> + <ngram occurrences="8" value="ten_" /> + <ngram occurrences="8" value="sä_" /> + <ngram occurrences="8" value="stu" /> + <ngram occurrences="8" value="ssä_" /> + <ngram occurrences="8" value="ssä" /> + <ngram occurrences="8" value="so" /> + <ngram occurrences="8" value="sia" /> + <ngram occurrences="8" value="ses" /> + <ngram occurrences="8" value="rk" /> + <ngram occurrences="8" value="rj" /> + <ngram occurrences="8" value="po" /> + <ngram occurrences="8" value="pe" /> + <ngram occurrences="8" value="ou" /> + <ngram occurrences="8" value="ost" /> + <ngram occurrences="8" value="op" /> + <ngram occurrences="8" value="no" /> + <ngram occurrences="8" value="nen_" /> + <ngram occurrences="8" value="nen" /> + <ngram occurrences="8" value="n_h" /> + <ngram occurrences="8" value="n_e" /> + <ngram occurrences="8" value="maa" /> + <ngram occurrences="8" value="lle_" /> + <ngram occurrences="8" value="lai" /> + <ngram occurrences="8" value="kä" /> + <ngram occurrences="8" value="kin" /> + <ngram occurrences="8" value="kesk" /> + <ngram occurrences="8" value="kes" /> + <ngram occurrences="8" value="kaup" /> + <ngram occurrences="8" value="kan" /> + <ngram occurrences="8" value="iste" /> + <ngram occurrences="8" value="isi" /> + <ngram occurrences="8" value="int" /> + <ngram occurrences="8" value="ine" /> + <ngram occurrences="8" value="ila" /> + <ngram occurrences="8" value="iksi_" /> + <ngram occurrences="8" value="iksi" /> + <ngram occurrences="8" value="ien" /> + <ngram occurrences="8" value="ia_" /> + <ngram occurrences="8" value="ess" /> + <ngram occurrences="8" value="esk" /> + <ngram occurrences="8" value="aup" /> + <ngram occurrences="8" value="ari" /> + <ngram occurrences="8" value="ank" /> + <ngram occurrences="8" value="a_e" /> + <ngram occurrences="8" value="_si" /> + <ngram occurrences="8" value="_pä" /> + <ngram occurrences="8" value="_ole" /> + <ngram occurrences="8" value="_kesk" /> + <ngram occurrences="8" value="_kes" /> + <ngram occurrences="8" value="_hal" /> + <ngram occurrences="7" value="ävä" /> + <ngram occurrences="7" value="äs" /> + <ngram occurrences="7" value="vat_" /> + <ngram occurrences="7" value="vat" /> + <ngram occurrences="7" value="val" /> + <ngram occurrences="7" value="ukse" /> + <ngram occurrences="7" value="ui" /> + <ngram occurrences="7" value="til" /> + <ngram occurrences="7" value="ti_" /> + <ngram occurrences="7" value="tet" /> + <ngram occurrences="7" value="tel" /> + <ngram occurrences="7" value="tav" /> + <ngram occurrences="7" value="taan_" /> + <ngram occurrences="7" value="taan" /> + <ngram occurrences="7" value="suu" /> + <ngram occurrences="7" value="suo" /> + <ngram occurrences="7" value="stä_" /> + <ngram occurrences="7" value="sku" /> + <ngram occurrences="7" value="sit" /> + <ngram occurrences="7" value="sen_" /> + <ngram occurrences="7" value="ri_" /> + <ngram occurrences="7" value="pu" /> + <ngram occurrences="7" value="pp" /> + <ngram occurrences="7" value="omi" /> + <ngram occurrences="7" value="oll" /> + <ngram occurrences="7" value="oimin" /> + <ngram occurrences="7" value="nä" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="n_tu" /> + <ngram occurrences="7" value="n_o" /> + <ngram occurrences="7" value="n_ka" /> + <ngram occurrences="7" value="mä" /> + <ngram occurrences="7" value="lä_" /> + <ngram occurrences="7" value="lo" /> + <ngram occurrences="7" value="lm" /> + <ngram occurrences="7" value="llä" /> + <ngram occurrences="7" value="li_" /> + <ngram occurrences="7" value="lais" /> + <ngram occurrences="7" value="kin_" /> + <ngram occurrences="7" value="ita" /> + <ngram occurrences="7" value="iss" /> + <ngram occurrences="7" value="inn" /> + <ngram occurrences="7" value="inen_" /> + <ngram occurrences="7" value="inen" /> + <ngram occurrences="7" value="imin" /> + <ngram occurrences="7" value="ill" /> + <ngram occurrences="7" value="ho" /> + <ngram occurrences="7" value="ev" /> + <ngram occurrences="7" value="eu" /> + <ngram occurrences="7" value="ella" /> + <ngram occurrences="7" value="een" /> + <ngram occurrences="7" value="ava" /> + <ngram occurrences="7" value="aka" /> + <ngram occurrences="7" value="ain" /> + <ngram occurrences="7" value="a_l" /> + <ngram occurrences="7" value="_yh" /> + <ngram occurrences="7" value="_vai" /> + <ngram occurrences="7" value="_u" /> + <ngram occurrences="7" value="_suo" /> + <ngram occurrences="7" value="_se" /> + <ngram occurrences="7" value="_r" /> + <ngram occurrences="7" value="_mu" /> +</ngrams> diff --git a/src/plugins/language/french.klp b/src/plugins/language/french.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="830" value="_" /> + <ngram occurrences="558" value="e" /> + <ngram occurrences="338" value="s" /> + <ngram occurrences="303" value="i" /> + <ngram occurrences="285" value="r" /> + <ngram occurrences="283" value="n" /> + <ngram occurrences="282" value="a" /> + <ngram occurrences="256" value="t" /> + <ngram occurrences="226" value="e_" /> + <ngram occurrences="215" value="o" /> + <ngram occurrences="207" value="u" /> + <ngram occurrences="199" value="l" /> + <ngram occurrences="184" value="s_" /> + <ngram occurrences="184" value="d" /> + <ngram occurrences="139" value="_d" /> + <ngram occurrences="137" value="c" /> + <ngram occurrences="130" value="p" /> + <ngram occurrences="127" value="é" /> + <ngram occurrences="104" value="m" /> + <ngram occurrences="100" value="es" /> + <ngram occurrences="100" value="_l" /> + <ngram occurrences="85" value="t_" /> + <ngram occurrences="79" value="on" /> + <ngram occurrences="78" value="le" /> + <ngram occurrences="78" value="es_" /> + <ngram occurrences="78" value="de" /> + <ngram occurrences="72" value="_de" /> + <ngram occurrences="68" value="re" /> + <ngram occurrences="68" value="en" /> + <ngram occurrences="66" value="_a" /> + <ngram occurrences="64" value="f" /> + <ngram occurrences="60" value="_p" /> + <ngram occurrences="59" value="n_" /> + <ngram occurrences="56" value="_e" /> + <ngram occurrences="56" value="_c" /> + <ngram occurrences="54" value="de_" /> + <ngram occurrences="53" value="nt" /> + <ngram occurrences="53" value="g" /> + <ngram occurrences="52" value="r_" /> + <ngram occurrences="52" value="_de_" /> + <ngram occurrences="51" value="_le" /> + <ngram occurrences="48" value="v" /> + <ngram occurrences="48" value="an" /> + <ngram occurrences="48" value="_s" /> + <ngram occurrences="44" value="er" /> + <ngram occurrences="42" value="h" /> + <ngram occurrences="42" value="a_" /> + <ngram occurrences="40" value="qu" /> + <ngram occurrences="40" value="q" /> + <ngram occurrences="40" value="ai" /> + <ngram occurrences="38" value="ou" /> + <ngram occurrences="38" value="it" /> + <ngram occurrences="38" value="is" /> + <ngram occurrences="38" value="_m" /> + <ngram occurrences="36" value="le_" /> + <ngram occurrences="35" value="te" /> + <ngram occurrences="35" value="ra" /> + <ngram occurrences="35" value="ns" /> + <ngram occurrences="35" value="la" /> + <ngram occurrences="35" value="io" /> + <ngram occurrences="34" value="ti" /> + <ngram occurrences="34" value="e_d" /> + <ngram occurrences="34" value="co" /> + <ngram occurrences="33" value="u_" /> + <ngram occurrences="33" value="se" /> + <ngram occurrences="32" value="ion" /> + <ngram occurrences="31" value="les_" /> + <ngram occurrences="31" value="les" /> + <ngram occurrences="30" value="s_d" /> + <ngram occurrences="30" value="in" /> + <ngram occurrences="30" value="ie" /> + <ngram occurrences="29" value="ur" /> + <ngram occurrences="29" value="_f" /> + <ngram occurrences="28" value="é_" /> + <ngram occurrences="28" value="re_" /> + <ngram occurrences="28" value="nt_" /> + <ngram occurrences="28" value="b" /> + <ngram occurrences="27" value="pr" /> + <ngram occurrences="27" value="on_" /> + <ngram occurrences="27" value="ar" /> + <ngram occurrences="27" value="_t" /> + <ngram occurrences="26" value="et" /> + <ngram occurrences="26" value="ent" /> + <ngram occurrences="26" value="di" /> + <ngram occurrences="26" value="_r" /> + <ngram occurrences="26" value="_le_" /> + <ngram occurrences="25" value="tr" /> + <ngram occurrences="25" value="ns_" /> + <ngram occurrences="25" value="me" /> + <ngram occurrences="25" value="l_" /> + <ngram occurrences="25" value="e_l" /> + <ngram occurrences="25" value="ce" /> + <ngram occurrences="25" value="_qu" /> + <ngram occurrences="25" value="_q" /> + <ngram occurrences="25" value="_la" /> + <ngram occurrences="25" value="_co" /> + <ngram occurrences="24" value="è" /> + <ngram occurrences="24" value="ui" /> + <ngram occurrences="24" value="_i" /> + <ngram occurrences="23" value="po" /> + <ngram occurrences="23" value="pa" /> + <ngram occurrences="23" value="la_" /> + <ngram occurrences="23" value="ir" /> + <ngram occurrences="23" value="au" /> + <ngram occurrences="23" value="_les_" /> + <ngram occurrences="23" value="_les" /> + <ngram occurrences="23" value="_la_" /> + <ngram occurrences="22" value="ue" /> + <ngram occurrences="22" value="t_d" /> + <ngram occurrences="22" value="s_l" /> + <ngram occurrences="22" value="ro" /> + <ngram occurrences="22" value="or" /> + <ngram occurrences="22" value="nd" /> + <ngram occurrences="22" value="ion_" /> + <ngram occurrences="22" value="eu" /> + <ngram occurrences="22" value="at" /> + <ngram occurrences="21" value="tion" /> + <ngram occurrences="21" value="tio" /> + <ngram occurrences="21" value="st" /> + <ngram occurrences="21" value="nc" /> + <ngram occurrences="21" value="e_de" /> + <ngram occurrences="21" value="dé" /> + <ngram occurrences="21" value="ch" /> + <ngram occurrences="20" value="si" /> + <ngram occurrences="20" value="ons" /> + <ngram occurrences="20" value="ne" /> + <ngram occurrences="20" value="et_" /> + <ngram occurrences="20" value="_pa" /> + <ngram occurrences="20" value="_en" /> + <ngram occurrences="19" value="ve" /> + <ngram occurrences="19" value="un" /> + <ngram occurrences="19" value="ts" /> + <ngram occurrences="19" value="ss" /> + <ngram occurrences="19" value="s_c" /> + <ngram occurrences="19" value="que" /> + <ngram occurrences="19" value="er_" /> + <ngram occurrences="18" value="té" /> + <ngram occurrences="18" value="ts_" /> + <ngram occurrences="18" value="it_" /> + <ngram occurrences="18" value="il" /> + <ngram occurrences="18" value="i_" /> + <ngram occurrences="18" value="el" /> + <ngram occurrences="18" value="e_s" /> + <ngram occurrences="18" value="_n" /> + <ngram occurrences="17" value="sa" /> + <ngram occurrences="17" value="ré" /> + <ngram occurrences="17" value="ma" /> + <ngram occurrences="17" value="e_c" /> + <ngram occurrences="17" value="d_" /> + <ngram occurrences="17" value="_et" /> + <ngram occurrences="17" value="_dé" /> + <ngram occurrences="16" value="x" /> + <ngram occurrences="16" value="se_" /> + <ngram occurrences="16" value="s_p" /> + <ngram occurrences="16" value="s_de" /> + <ngram occurrences="16" value="li" /> + <ngram occurrences="16" value="_et_" /> + <ngram occurrences="15" value="à_" /> + <ngram occurrences="15" value="à" /> + <ngram occurrences="15" value="ut" /> + <ngram occurrences="15" value="s_a" /> + <ngram occurrences="15" value="ri" /> + <ngram occurrences="15" value="om" /> + <ngram occurrences="15" value="n_d" /> + <ngram occurrences="15" value="j" /> + <ngram occurrences="15" value="ent_" /> + <ngram occurrences="15" value="e_e" /> + <ngram occurrences="15" value="e_de_" /> + <ngram occurrences="15" value="ci" /> + <ngram occurrences="15" value="ap" /> + <ngram occurrences="15" value="_à_" /> + <ngram occurrences="15" value="_à" /> + <ngram occurrences="15" value="_u" /> + <ngram occurrences="15" value="_se" /> + <ngram occurrences="15" value="_pr" /> + <ngram occurrences="15" value="_g" /> + <ngram occurrences="14" value="ér" /> + <ngram occurrences="14" value="tion_" /> + <ngram occurrences="14" value="s_le" /> + <ngram occurrences="14" value="rt" /> + <ngram occurrences="14" value="pe" /> + <ngram occurrences="14" value="par" /> + <ngram occurrences="14" value="ont" /> + <ngram occurrences="14" value="oi" /> + <ngram occurrences="14" value="mi" /> + <ngram occurrences="14" value="he" /> + <ngram occurrences="14" value="en_" /> + <ngram occurrences="14" value="em" /> + <ngram occurrences="14" value="ec" /> + <ngram occurrences="14" value="e_p" /> + <ngram occurrences="14" value="e_m" /> + <ngram occurrences="14" value="e_f" /> + <ngram occurrences="14" value="e_a" /> + <ngram occurrences="14" value="con" /> + <ngram occurrences="14" value="as" /> + <ngram occurrences="14" value="ait" /> + <ngram occurrences="14" value="_par" /> + <ngram occurrences="14" value="_l_" /> + <ngram occurrences="13" value="és" /> + <ngram occurrences="13" value="ue_" /> + <ngram occurrences="13" value="té_" /> + <ngram occurrences="13" value="te_" /> + <ngram occurrences="13" value="so" /> + <ngram occurrences="13" value="s_r" /> + <ngram occurrences="13" value="s_de_" /> + <ngram occurrences="13" value="r_l" /> + <ngram occurrences="13" value="ons_" /> + <ngram occurrences="13" value="mp" /> + <ngram occurrences="13" value="is_" /> + <ngram occurrences="13" value="ire" /> + <ngram occurrences="13" value="_un" /> + <ngram occurrences="13" value="_re" /> + <ngram occurrences="13" value="_o" /> + <ngram occurrences="13" value="_j" /> + <ngram occurrences="13" value="_in" /> + <ngram occurrences="13" value="_di" /> + <ngram occurrences="13" value="_d_" /> + <ngram occurrences="13" value="_con" /> + <ngram occurrences="13" value="_ce" /> + <ngram occurrences="12" value="ès_" /> + <ngram occurrences="12" value="ès" /> + <ngram occurrences="12" value="y" /> + <ngram occurrences="12" value="vi" /> + <ngram occurrences="12" value="ur_" /> + <ngram occurrences="12" value="ta" /> + <ngram occurrences="12" value="su" /> + <ngram occurrences="12" value="our" /> + <ngram occurrences="12" value="ni" /> + <ngram occurrences="12" value="ne_" /> + <ngram occurrences="12" value="mo" /> + <ngram occurrences="12" value="ge" /> + <ngram occurrences="12" value="fi" /> + <ngram occurrences="12" value="est" /> + <ngram occurrences="12" value="es_r" /> + <ngram occurrences="12" value="es_d" /> + <ngram occurrences="12" value="bl" /> + <ngram occurrences="12" value="av" /> + <ngram occurrences="12" value="_so" /> + <ngram occurrences="12" value="_h" /> + <ngram occurrences="11" value="ét" /> + <ngram occurrences="11" value="x_" /> + <ngram occurrences="11" value="un_" /> + <ngram occurrences="11" value="rs" /> + <ngram occurrences="11" value="res" /> + <ngram occurrences="11" value="que_" /> + <ngram occurrences="11" value="né" /> + <ngram occurrences="11" value="me_" /> + <ngram occurrences="11" value="e_le" /> + <ngram occurrences="11" value="des_" /> + <ngram occurrences="11" value="des" /> + <ngram occurrences="11" value="che" /> + <ngram occurrences="11" value="au_" /> + <ngram occurrences="11" value="ait_" /> + <ngram occurrences="11" value="ais" /> + <ngram occurrences="11" value="_su" /> + <ngram occurrences="11" value="_mo" /> + <ngram occurrences="11" value="_ma" /> + <ngram occurrences="11" value="_en_" /> + <ngram occurrences="11" value="_des_" /> + <ngram occurrences="11" value="_des" /> + <ngram occurrences="11" value="_av" /> + <ngram occurrences="11" value="_an" /> + <ngram occurrences="10" value="ée" /> + <ngram occurrences="10" value="éc" /> + <ngram occurrences="10" value="à_l" /> + <ngram occurrences="10" value="ux" /> + <ngram occurrences="10" value="us" /> + <ngram occurrences="10" value="up" /> + <ngram occurrences="10" value="ui_" /> + <ngram occurrences="10" value="t_de" /> + <ngram occurrences="10" value="sé" /> + <ngram occurrences="10" value="s_s" /> + <ngram occurrences="10" value="s_e" /> + <ngram occurrences="10" value="r_d" /> + <ngram occurrences="10" value="pro" /> + <ngram occurrences="10" value="pp" /> + <ngram occurrences="10" value="pl" /> + <ngram occurrences="10" value="nt_d" /> + <ngram occurrences="10" value="n_de" /> + <ngram occurrences="10" value="iqu" /> + <ngram occurrences="10" value="iq" /> + <ngram occurrences="10" value="ions_" /> + <ngram occurrences="10" value="ions" /> + <ngram occurrences="10" value="il_" /> + <ngram occurrences="10" value="ien" /> + <ngram occurrences="10" value="ic" /> + <ngram occurrences="10" value="e_qu" /> + <ngram occurrences="10" value="e_q" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="da" /> + <ngram occurrences="10" value="ces" /> + <ngram occurrences="10" value="ati" /> + <ngram occurrences="10" value="ans" /> + <ngram occurrences="10" value="_à_l" /> + <ngram occurrences="10" value="_il" /> + <ngram occurrences="10" value="_b" /> + <ngram occurrences="10" value="_au" /> + <ngram occurrences="10" value="_a_" /> + <ngram occurrences="9" value="tre" /> + <ngram occurrences="9" value="to" /> + <ngram occurrences="9" value="s_le_" /> + <ngram occurrences="9" value="rès_" /> + <ngram occurrences="9" value="rès" /> + <ngram occurrences="9" value="rè" /> + <ngram occurrences="9" value="rs_" /> + <ngram occurrences="9" value="r_le" /> + <ngram occurrences="9" value="qui_" /> + <ngram occurrences="9" value="qui" /> + <ngram occurrences="9" value="on_d" /> + <ngram occurrences="9" value="nte" /> + <ngram occurrences="9" value="men" /> + <ngram occurrences="9" value="ll" /> + <ngram occurrences="9" value="ique" /> + <ngram occurrences="9" value="ion_d" /> + <ngram occurrences="9" value="id" /> + <ngram occurrences="9" value="fo" /> + <ngram occurrences="9" value="e_n" /> + <ngram occurrences="9" value="e_co" /> + <ngram occurrences="9" value="dr" /> + <ngram occurrences="9" value="de_l" /> + <ngram occurrences="9" value="com" /> + <ngram occurrences="9" value="ces_" /> + <ngram occurrences="9" value="ce_" /> + <ngram occurrences="9" value="c_" /> + <ngram occurrences="9" value="ation" /> + <ngram occurrences="9" value="atio" /> + <ngram occurrences="9" value="ans_" /> + <ngram occurrences="9" value="anc" /> + <ngram occurrences="9" value="al" /> + <ngram occurrences="9" value="_un_" /> + <ngram occurrences="9" value="_tr" /> + <ngram occurrences="9" value="_qui_" /> + <ngram occurrences="9" value="_qui" /> + <ngram occurrences="9" value="_pro" /> + <ngram occurrences="9" value="_il_" /> + <ngram occurrences="9" value="_es" /> + <ngram occurrences="9" value="_ch" /> + <ngram occurrences="9" value="_au_" /> + <ngram occurrences="8" value="ê" /> + <ngram occurrences="8" value="ég" /> + <ngram occurrences="8" value="ée_" /> + <ngram occurrences="8" value="é_d" /> + <ngram occurrences="8" value="à_la" /> + <ngram occurrences="8" value="ux_" /> + <ngram occurrences="8" value="t_p" /> + <ngram occurrences="8" value="t_de_" /> + <ngram occurrences="8" value="t_c" /> + <ngram occurrences="8" value="st_" /> + <ngram occurrences="8" value="ser" /> + <ngram occurrences="8" value="s_m" /> + <ngram occurrences="8" value="rec" /> + <ngram occurrences="8" value="r_de" /> + <ngram occurrences="8" value="pu" /> + <ngram occurrences="8" value="oup" /> + <ngram occurrences="8" value="ont_" /> + <ngram occurrences="8" value="no" /> + <ngram occurrences="8" value="nn" /> + <ngram occurrences="8" value="ndr" /> + <ngram occurrences="8" value="ndi" /> + <ngram occurrences="8" value="na" /> + <ngram occurrences="8" value="mé" /> + <ngram occurrences="8" value="ment" /> + <ngram occurrences="8" value="mai" /> + <ngram occurrences="8" value="lé" /> + <ngram occurrences="8" value="ité" /> + <ngram occurrences="8" value="ig" /> + <ngram occurrences="8" value="if" /> + <ngram occurrences="8" value="ier" /> + <ngram occurrences="8" value="he_" /> + <ngram occurrences="8" value="ha" /> + <ngram occurrences="8" value="gr" /> + <ngram occurrences="8" value="ff" /> + <ngram occurrences="8" value="est_" /> + <ngram occurrences="8" value="es_c" /> + <ngram occurrences="8" value="ent_d" /> + <ngram occurrences="8" value="ement" /> + <ngram occurrences="8" value="emen" /> + <ngram occurrences="8" value="eme" /> + <ngram occurrences="8" value="do" /> + <ngram occurrences="8" value="de_f" /> + <ngram occurrences="8" value="ct" /> + <ngram occurrences="8" value="ca" /> + <ngram occurrences="8" value="app" /> + <ngram occurrences="8" value="ant" /> + <ngram occurrences="8" value="_é" /> + <ngram occurrences="8" value="_à_la" /> + <ngram occurrences="8" value="_v" /> + <ngram occurrences="8" value="_to" /> + <ngram occurrences="8" value="_po" /> + <ngram occurrences="8" value="_est_" /> + <ngram occurrences="8" value="_est" /> + <ngram occurrences="8" value="_do" /> + <ngram occurrences="8" value="_de_l" /> + <ngram occurrences="8" value="_de_f" /> + <ngram occurrences="8" value="_ap" /> + <ngram occurrences="7" value="és_" /> + <ngram occurrences="7" value="él" /> + <ngram occurrences="7" value="é_l" /> + <ngram occurrences="7" value="va" /> + <ngram occurrences="7" value="um" /> +</ngrams> diff --git a/src/plugins/language/frisian.klp b/src/plugins/language/frisian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="829" value="_" /> + <ngram occurrences="604" value="e" /> + <ngram occurrences="352" value="n" /> + <ngram occurrences="277" value="t" /> + <ngram occurrences="270" value="a" /> + <ngram occurrences="251" value="i" /> + <ngram occurrences="248" value="r" /> + <ngram occurrences="240" value="s" /> + <ngram occurrences="201" value="n_" /> + <ngram occurrences="184" value="o" /> + <ngram occurrences="174" value="d" /> + <ngram occurrences="161" value="e_" /> + <ngram occurrences="147" value="l" /> + <ngram occurrences="146" value="k" /> + <ngram occurrences="135" value="t_" /> + <ngram occurrences="125" value="en" /> + <ngram occurrences="106" value="en_" /> + <ngram occurrences="103" value="m" /> + <ngram occurrences="100" value="f" /> + <ngram occurrences="96" value="_d" /> + <ngram occurrences="90" value="er" /> + <ngram occurrences="89" value="h" /> + <ngram occurrences="88" value="y" /> + <ngram occurrences="88" value="de" /> + <ngram occurrences="86" value="w" /> + <ngram occurrences="86" value="p" /> + <ngram occurrences="77" value="u" /> + <ngram occurrences="71" value="_f" /> + <ngram occurrences="70" value="j" /> + <ngram occurrences="66" value="_s" /> + <ngram occurrences="65" value="b" /> + <ngram occurrences="62" value="in" /> + <ngram occurrences="61" value="_w" /> + <ngram occurrences="61" value="_i" /> + <ngram occurrences="60" value="s_" /> + <ngram occurrences="55" value="r_" /> + <ngram occurrences="53" value="_e" /> + <ngram occurrences="52" value="te" /> + <ngram occurrences="52" value="an" /> + <ngram occurrences="51" value="de_" /> + <ngram occurrences="50" value="g" /> + <ngram occurrences="50" value="_de" /> + <ngram occurrences="45" value="at" /> + <ngram occurrences="45" value="ar" /> + <ngram occurrences="45" value="_o" /> + <ngram occurrences="45" value="_b" /> + <ngram occurrences="43" value="_h" /> + <ngram occurrences="39" value="sk" /> + <ngram occurrences="39" value="ie" /> + <ngram occurrences="39" value="_de_" /> + <ngram occurrences="37" value="ke" /> + <ngram occurrences="36" value="st" /> + <ngram occurrences="36" value="ne" /> + <ngram occurrences="36" value="an_" /> + <ngram occurrences="36" value="_t" /> + <ngram occurrences="35" value="it" /> + <ngram occurrences="35" value="_m" /> + <ngram occurrences="34" value="oa" /> + <ngram occurrences="34" value="ei" /> + <ngram occurrences="33" value="yn" /> + <ngram occurrences="33" value="le" /> + <ngram occurrences="33" value="c" /> + <ngram occurrences="33" value="at_" /> + <ngram occurrences="32" value="re" /> + <ngram occurrences="32" value="er_" /> + <ngram occurrences="32" value="ch" /> + <ngram occurrences="31" value="n_d" /> + <ngram occurrences="30" value="je" /> + <ngram occurrences="29" value="me" /> + <ngram occurrences="29" value="et" /> + <ngram occurrences="28" value="k_" /> + <ngram occurrences="28" value="_k" /> + <ngram occurrences="27" value="yn_" /> + <ngram occurrences="27" value="se" /> + <ngram occurrences="27" value="oe" /> + <ngram occurrences="27" value="in_" /> + <ngram occurrences="26" value="op" /> + <ngram occurrences="26" value="_n" /> + <ngram occurrences="26" value="_en_" /> + <ngram occurrences="26" value="_en" /> + <ngram occurrences="25" value="p_" /> + <ngram occurrences="25" value="it_" /> + <ngram occurrences="25" value="es" /> + <ngram occurrences="25" value="_a" /> + <ngram occurrences="24" value="ri" /> + <ngram occurrences="24" value="ha" /> + <ngram occurrences="24" value="da" /> + <ngram occurrences="24" value="be" /> + <ngram occurrences="24" value="al" /> + <ngram occurrences="24" value="_y" /> + <ngram occurrences="23" value="sj" /> + <ngram occurrences="23" value="ol" /> + <ngram occurrences="23" value="ns" /> + <ngram occurrences="23" value="el" /> + <ngram occurrences="23" value="_yn" /> + <ngram occurrences="22" value="y_" /> + <ngram occurrences="22" value="ro" /> + <ngram occurrences="22" value="m_" /> + <ngram occurrences="22" value="i_" /> + <ngram occurrences="22" value="fa" /> + <ngram occurrences="22" value="_in" /> + <ngram occurrences="21" value="we" /> + <ngram occurrences="21" value="ei_" /> + <ngram occurrences="21" value="ea" /> + <ngram occurrences="21" value="_p" /> + <ngram occurrences="21" value="_in_" /> + <ngram occurrences="21" value="_fa" /> + <ngram occurrences="20" value="li" /> + <ngram occurrences="20" value="ge" /> + <ngram occurrences="20" value="ek" /> + <ngram occurrences="20" value="am" /> + <ngram occurrences="20" value="_it" /> + <ngram occurrences="19" value="wa" /> + <ngram occurrences="19" value="ter" /> + <ngram occurrences="19" value="ske" /> + <ngram occurrences="19" value="op_" /> + <ngram occurrences="19" value="ma" /> + <ngram occurrences="19" value="l_" /> + <ngram occurrences="19" value="fo" /> + <ngram occurrences="19" value="fe" /> + <ngram occurrences="19" value="et_" /> + <ngram occurrences="19" value="_yn_" /> + <ngram occurrences="19" value="_op" /> + <ngram occurrences="19" value="_it_" /> + <ngram occurrences="19" value="_ha" /> + <ngram occurrences="19" value="_fo" /> + <ngram occurrences="19" value="_da" /> + <ngram occurrences="19" value="_be" /> + <ngram occurrences="18" value="rd" /> + <ngram occurrences="18" value="fan_" /> + <ngram occurrences="18" value="fan" /> + <ngram occurrences="18" value="ar_" /> + <ngram occurrences="18" value="aa" /> + <ngram occurrences="18" value="_g" /> + <ngram occurrences="18" value="_fan_" /> + <ngram occurrences="18" value="_fan" /> + <ngram occurrences="17" value="t_d" /> + <ngram occurrences="17" value="oar" /> + <ngram occurrences="17" value="nt" /> + <ngram occurrences="17" value="n_de" /> + <ngram occurrences="17" value="is" /> + <ngram occurrences="17" value="der" /> + <ngram occurrences="17" value="_r" /> + <ngram occurrences="16" value="û" /> + <ngram occurrences="16" value="om" /> + <ngram occurrences="16" value="nn" /> + <ngram occurrences="16" value="n_s" /> + <ngram occurrences="16" value="n_f" /> + <ngram occurrences="16" value="je_" /> + <ngram occurrences="16" value="e_f" /> + <ngram occurrences="16" value="dat" /> + <ngram occurrences="16" value="_op_" /> + <ngram occurrences="16" value="_l" /> + <ngram occurrences="15" value="ê" /> + <ngram occurrences="15" value="ti" /> + <ngram occurrences="15" value="st_" /> + <ngram occurrences="15" value="mei" /> + <ngram occurrences="15" value="ll" /> + <ngram occurrences="15" value="h_" /> + <ngram occurrences="15" value="di" /> + <ngram occurrences="15" value="dat_" /> + <ngram occurrences="15" value="_wa" /> + <ngram occurrences="15" value="_se" /> + <ngram occurrences="15" value="_ne" /> + <ngram occurrences="15" value="_j" /> + <ngram occurrences="15" value="_dat_" /> + <ngram occurrences="15" value="_dat" /> + <ngram occurrences="14" value="ys" /> + <ngram occurrences="14" value="ts" /> + <ngram occurrences="14" value="t_f" /> + <ngram occurrences="14" value="sje" /> + <ngram occurrences="14" value="och" /> + <ngram occurrences="14" value="oc" /> + <ngram occurrences="14" value="n_w" /> + <ngram occurrences="14" value="n_o" /> + <ngram occurrences="14" value="n_de_" /> + <ngram occurrences="14" value="le_" /> + <ngram occurrences="14" value="jo" /> + <ngram occurrences="14" value="fer" /> + <ngram occurrences="14" value="eu" /> + <ngram occurrences="14" value="en_d" /> + <ngram occurrences="14" value="ed" /> + <ngram occurrences="14" value="ch_" /> + <ngram occurrences="14" value="ak" /> + <ngram occurrences="14" value="_me" /> + <ngram occurrences="13" value="v" /> + <ngram occurrences="13" value="tr" /> + <ngram occurrences="13" value="ry" /> + <ngram occurrences="13" value="rs" /> + <ngram occurrences="13" value="nne" /> + <ngram occurrences="13" value="ng" /> + <ngram occurrences="13" value="n_i" /> + <ngram occurrences="13" value="n_e" /> + <ngram occurrences="13" value="mei_" /> + <ngram occurrences="13" value="ik" /> + <ngram occurrences="13" value="a_" /> + <ngram occurrences="13" value="_oa" /> + <ngram occurrences="13" value="_ma" /> + <ngram occurrences="13" value="_fe" /> + <ngram occurrences="12" value="wi" /> + <ngram occurrences="12" value="ur" /> + <ngram occurrences="12" value="tt" /> + <ngram occurrences="12" value="nt_" /> + <ngram occurrences="12" value="lle" /> + <ngram occurrences="12" value="is_" /> + <ngram occurrences="12" value="ht" /> + <ngram occurrences="12" value="e_m" /> + <ngram occurrences="12" value="e_b" /> + <ngram occurrences="12" value="der_" /> + <ngram occurrences="12" value="d_" /> + <ngram occurrences="12" value="cht" /> + <ngram occurrences="12" value="_we" /> + <ngram occurrences="12" value="_tr" /> + <ngram occurrences="12" value="_mei" /> + <ngram occurrences="12" value="_fer" /> + <ngram occurrences="11" value="ysk" /> + <ngram occurrences="11" value="wo" /> + <ngram occurrences="11" value="ut" /> + <ngram occurrences="11" value="ten" /> + <ngram occurrences="11" value="te_" /> + <ngram occurrences="11" value="t_i" /> + <ngram occurrences="11" value="t_h" /> + <ngram occurrences="11" value="sy" /> + <ngram occurrences="11" value="ra" /> + <ngram occurrences="11" value="po" /> + <ngram occurrences="11" value="net_" /> + <ngram occurrences="11" value="net" /> + <ngram occurrences="11" value="kr" /> + <ngram occurrences="11" value="ken" /> + <ngram occurrences="11" value="ke_" /> + <ngram occurrences="11" value="ka" /> + <ngram occurrences="11" value="ji" /> + <ngram occurrences="11" value="foar" /> + <ngram occurrences="11" value="foa" /> + <ngram occurrences="11" value="ers" /> + <ngram occurrences="11" value="en_f" /> + <ngram occurrences="11" value="ear" /> + <ngram occurrences="11" value="e_w" /> + <ngram occurrences="11" value="e_k" /> + <ngram occurrences="11" value="e_e" /> + <ngram occurrences="11" value="e_d" /> + <ngram occurrences="11" value="den_" /> + <ngram occurrences="11" value="den" /> + <ngram occurrences="11" value="as" /> + <ngram occurrences="11" value="_mei_" /> + <ngram occurrences="11" value="_foar" /> + <ngram occurrences="11" value="_foa" /> + <ngram occurrences="10" value="wat_" /> + <ngram occurrences="10" value="wat" /> + <ngram occurrences="10" value="us" /> + <ngram occurrences="10" value="un" /> + <ngram occurrences="10" value="tu" /> + <ngram occurrences="10" value="tte" /> + <ngram occurrences="10" value="tsj" /> + <ngram occurrences="10" value="t_s" /> + <ngram occurrences="10" value="t_de" /> + <ngram occurrences="10" value="rys" /> + <ngram occurrences="10" value="re_" /> + <ngram occurrences="10" value="oar_" /> + <ngram occurrences="10" value="oan" /> + <ngram occurrences="10" value="ne_" /> + <ngram occurrences="10" value="lle_" /> + <ngram occurrences="10" value="ko" /> + <ngram occurrences="10" value="inne" /> + <ngram occurrences="10" value="inn" /> + <ngram occurrences="10" value="ing" /> + <ngram occurrences="10" value="he" /> + <ngram occurrences="10" value="gr" /> + <ngram occurrences="10" value="fr" /> + <ngram occurrences="10" value="f_" /> + <ngram occurrences="10" value="es_" /> + <ngram occurrences="10" value="en_o" /> + <ngram occurrences="10" value="ek_" /> + <ngram occurrences="10" value="e_s" /> + <ngram occurrences="10" value="br" /> + <ngram occurrences="10" value="an_d" /> + <ngram occurrences="10" value="_wat_" /> + <ngram occurrences="10" value="_wat" /> + <ngram occurrences="10" value="_net_" /> + <ngram occurrences="10" value="_net" /> + <ngram occurrences="10" value="_fr" /> + <ngram occurrences="10" value="_al" /> + <ngram occurrences="9" value="ú" /> + <ngram occurrences="9" value="â" /> + <ngram occurrences="9" value="z" /> + <ngram occurrences="9" value="wur" /> + <ngram occurrences="9" value="wu" /> + <ngram occurrences="9" value="wer" /> + <ngram occurrences="9" value="t_w" /> + <ngram occurrences="9" value="t_e" /> + <ngram occurrences="9" value="ske_" /> + <ngram occurrences="9" value="s_d" /> + <ngram occurrences="9" value="nne_" /> + <ngram occurrences="9" value="n_h" /> + <ngram occurrences="9" value="ld" /> + <ngram occurrences="9" value="kt" /> + <ngram occurrences="9" value="ken_" /> + <ngram occurrences="9" value="ins" /> + <ngram occurrences="9" value="inne_" /> + <ngram occurrences="9" value="ij" /> + <ngram occurrences="9" value="ier" /> + <ngram occurrences="9" value="id" /> + <ngram occurrences="9" value="hi" /> + <ngram occurrences="9" value="do" /> + <ngram occurrences="9" value="die" /> + <ngram occurrences="9" value="_ú" /> + <ngram occurrences="9" value="_wur" /> + <ngram occurrences="9" value="_wu" /> + <ngram occurrences="9" value="_wi" /> + <ngram occurrences="9" value="_oan" /> + <ngram occurrences="9" value="_ek_" /> + <ngram occurrences="9" value="_ek" /> + <ngram occurrences="9" value="_der_" /> + <ngram occurrences="9" value="_der" /> + <ngram occurrences="8" value="ten_" /> + <ngram occurrences="8" value="t_de_" /> + <ngram occurrences="8" value="t_b" /> + <ngram occurrences="8" value="so" /> + <ngram occurrences="8" value="rysk" /> + <ngram occurrences="8" value="rt" /> + <ngram occurrences="8" value="rde" /> + <ngram occurrences="8" value="pp" /> + <ngram occurrences="8" value="pe" /> + <ngram occurrences="8" value="on" /> + <ngram occurrences="8" value="ns_" /> + <ngram occurrences="8" value="no" /> + <ngram occurrences="8" value="nd" /> + <ngram occurrences="8" value="n_b" /> + <ngram occurrences="8" value="mme" /> + <ngram occurrences="8" value="mm" /> + <ngram occurrences="8" value="mi" /> + <ngram occurrences="8" value="ls" /> + <ngram occurrences="8" value="lde" /> + <ngram occurrences="8" value="ks" /> + <ngram occurrences="8" value="kl" /> + <ngram occurrences="8" value="ki" /> + <ngram occurrences="8" value="im" /> + <ngram occurrences="8" value="il" /> + <ngram occurrences="8" value="frys" /> + <ngram occurrences="8" value="fry" /> + <ngram occurrences="8" value="foar_" /> + <ngram occurrences="8" value="est" /> + <ngram occurrences="8" value="ere" /> + <ngram occurrences="8" value="ep" /> + <ngram occurrences="8" value="en_w" /> + <ngram occurrences="8" value="en_e" /> + <ngram occurrences="8" value="e_o" /> + <ngram occurrences="8" value="e_i" /> + <ngram occurrences="8" value="e_h" /> + <ngram occurrences="8" value="at_d" /> + <ngram occurrences="8" value="an_de" /> + <ngram occurrences="8" value="alle" /> + <ngram occurrences="8" value="all" /> + <ngram occurrences="8" value="_wo" /> + <ngram occurrences="8" value="_wer" /> + <ngram occurrences="8" value="_sy" /> + <ngram occurrences="8" value="_st" /> + <ngram occurrences="8" value="_so" /> + <ngram occurrences="8" value="_sk" /> + <ngram occurrences="8" value="_is_" /> + <ngram occurrences="8" value="_is" /> + <ngram occurrences="8" value="_hi" /> + <ngram occurrences="8" value="_ge" /> + <ngram occurrences="8" value="_frys" /> + <ngram occurrences="8" value="_fry" /> + <ngram occurrences="8" value="_e_" /> + <ngram occurrences="7" value="ûn" /> + <ngram occurrences="7" value="ân" /> + <ngram occurrences="7" value="wol" /> + <ngram occurrences="7" value="u_" /> + <ngram occurrences="7" value="t_o" /> + <ngram occurrences="7" value="t_m" /> + <ngram occurrences="7" value="syn_" /> + <ngram occurrences="7" value="syn" /> + <ngram occurrences="7" value="ste" /> + <ngram occurrences="7" value="sp" /> + <ngram occurrences="7" value="sken" /> + <ngram occurrences="7" value="sel" /> + <ngram occurrences="7" value="r_i" /> + <ngram occurrences="7" value="pa" /> + <ngram occurrences="7" value="om_" /> + <ngram occurrences="7" value="of" /> + <ngram occurrences="7" value="oan_" /> + <ngram occurrences="7" value="ng_" /> + <ngram occurrences="7" value="nde" /> + <ngram occurrences="7" value="n_k" /> + <ngram occurrences="7" value="n_da" /> + <ngram occurrences="7" value="lik" /> + <ngram occurrences="7" value="jen" /> + <ngram occurrences="7" value="ite" /> + <ngram occurrences="7" value="ich" /> + <ngram occurrences="7" value="ic" /> + <ngram occurrences="7" value="ht_" /> + <ngram occurrences="7" value="hat_" /> + <ngram occurrences="7" value="hat" /> + <ngram occurrences="7" value="gen" /> + <ngram occurrences="7" value="g_" /> + <ngram occurrences="7" value="frysk" /> + <ngram occurrences="7" value="fan_d" /> + <ngram occurrences="7" value="erd" /> +</ngrams> diff --git a/src/plugins/language/georgian.klp b/src/plugins/language/georgian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="641" value="_" /> + <ngram occurrences="604" value="à" /> + <ngram occurrences="459" value="è" /> + <ngram occurrences="325" value="ä" /> + <ngram occurrences="245" value="ñ" /> + <ngram occurrences="245" value="ð" /> + <ngram occurrences="202" value="ê" /> + <ngram occurrences="194" value="ë" /> + <ngram occurrences="175" value="í" /> + <ngram occurrences="171" value="ã" /> + <ngram occurrences="160" value="è_" /> + <ngram occurrences="159" value="ì" /> + <ngram occurrences="157" value="å" /> + <ngram occurrences="147" value="à_" /> + <ngram occurrences="118" value="ç" /> + <ngram occurrences="115" value="ó" /> + <ngram occurrences="115" value="á" /> + <ngram occurrences="114" value="ñ_" /> + <ngram occurrences="108" value="â" /> + <ngram occurrences="94" value="êè" /> + <ngram occurrences="90" value="þ" /> + <ngram occurrences="80" value="ãà" /> + <ngram occurrences="80" value="_ë" /> + <ngram occurrences="79" value="èñ" /> + <ngram occurrences="71" value="àð" /> + <ngram occurrences="70" value="ø" /> + <ngram occurrences="62" value="_à" /> + <ngram occurrences="60" value="àì" /> + <ngram occurrences="59" value="äá" /> + <ngram occurrences="58" value="ñà" /> + <ngram occurrences="53" value="ò" /> + <ngram occurrences="53" value="ëà" /> + <ngram occurrences="53" value="êè_" /> + <ngram occurrences="51" value="ú" /> + <ngram occurrences="51" value="âà" /> + <ngram occurrences="51" value="_ã" /> + <ngram occurrences="49" value="ðè" /> + <ngram occurrences="48" value="_â" /> + <ngram occurrences="47" value="_ñ" /> + <ngram occurrences="45" value="õ" /> + <ngram occurrences="42" value="èñ_" /> + <ngram occurrences="41" value="óê" /> + <ngram occurrences="41" value="äê" /> + <ngram occurrences="40" value="é" /> + <ngram occurrences="40" value="àå" /> + <ngram occurrences="40" value="_ãà" /> + <ngram occurrences="39" value="åà" /> + <ngram occurrences="39" value="ãà_" /> + <ngram occurrences="38" value="åä" /> + <ngram occurrences="38" value="äð" /> + <ngram occurrences="38" value="àë" /> + <ngram occurrences="37" value="ìè" /> + <ngram occurrences="36" value="ðà" /> + <ngram occurrences="36" value="_è" /> + <ngram occurrences="35" value="ô" /> + <ngram occurrences="35" value="èê" /> + <ngram occurrences="35" value="æ" /> + <ngram occurrences="35" value="àê" /> + <ngram occurrences="34" value="åè" /> + <ngram occurrences="33" value="ì_" /> + <ngram occurrences="33" value="_ø" /> + <ngram occurrences="32" value="ðí" /> + <ngram occurrences="32" value="áà" /> + <ngram occurrences="32" value="àã" /> + <ngram occurrences="31" value="_ð" /> + <ngram occurrences="30" value="ü" /> + <ngram occurrences="30" value="_âà" /> + <ngram occurrences="29" value="èç" /> + <ngram occurrences="29" value="äì" /> + <ngram occurrences="29" value="áè" /> + <ngram occurrences="29" value="àñ" /> + <ngram occurrences="29" value="_ä" /> + <ngram occurrences="27" value="ðç" /> + <ngram occurrences="26" value="íá" /> + <ngram occurrences="26" value="í_" /> + <ngram occurrences="26" value="çà" /> + <ngram occurrences="26" value="äñ" /> + <ngram occurrences="25" value="øè" /> + <ngram occurrences="25" value="ä_" /> + <ngram occurrences="25" value="ãä" /> + <ngram occurrences="25" value="_ç" /> + <ngram occurrences="24" value="óêè" /> + <ngram occurrences="24" value="ëí" /> + <ngram occurrences="24" value="êí" /> + <ngram occurrences="24" value="_ñà" /> + <ngram occurrences="24" value="_ëà" /> + <ngram occurrences="23" value="èà" /> + <ngram occurrences="23" value="_àð" /> + <ngram occurrences="22" value="þä" /> + <ngram occurrences="22" value="ëä" /> + <ngram occurrences="22" value="äêè" /> + <ngram occurrences="22" value="_þ" /> + <ngram occurrences="21" value="íð" /> + <ngram occurrences="21" value="ìä" /> + <ngram occurrences="21" value="èì" /> + <ngram occurrences="21" value="èêè" /> + <ngram occurrences="21" value="äáè" /> + <ngram occurrences="21" value="ã_" /> + <ngram occurrences="20" value="øè_" /> + <ngram occurrences="20" value="ö" /> + <ngram occurrences="20" value="óð" /> + <ngram occurrences="20" value="ñ_ë" /> + <ngram occurrences="20" value="èñà" /> + <ngram occurrences="20" value="à_ë" /> + <ngram occurrences="19" value="øä" /> + <ngram occurrences="19" value="óêè_" /> + <ngram occurrences="19" value="ðä" /> + <ngram occurrences="19" value="ëè" /> + <ngram occurrences="19" value="è_à" /> + <ngram occurrences="19" value="ç_" /> + <ngram occurrences="19" value="áà_" /> + <ngram occurrences="19" value="àì_" /> + <ngram occurrences="19" value="_á" /> + <ngram occurrences="18" value="þà" /> + <ngram occurrences="18" value="û" /> + <ngram occurrences="18" value="ðè_" /> + <ngram occurrences="18" value="äñ_" /> + <ngram occurrences="18" value="àìè" /> + <ngram occurrences="18" value="_øä" /> + <ngram occurrences="18" value="_ãà_" /> + <ngram occurrences="17" value="ð_" /> + <ngram occurrences="17" value="ìè_" /> + <ngram occurrences="17" value="ìã" /> + <ngram occurrences="17" value="êèñ" /> + <ngram occurrences="17" value="èà_" /> + <ngram occurrences="17" value="äë" /> + <ngram occurrences="17" value="äáà" /> + <ngram occurrences="17" value="à_â" /> + <ngram occurrences="17" value="_ó" /> + <ngram occurrences="16" value="íñ" /> + <ngram occurrences="16" value="ìà" /> + <ngram occurrences="16" value="êä" /> + <ngram occurrences="16" value="çè" /> + <ngram occurrences="16" value="àâ" /> + <ngram occurrences="16" value="_é" /> + <ngram occurrences="16" value="_å" /> + <ngram occurrences="15" value="þå" /> + <ngram occurrences="15" value="ú_" /> + <ngram occurrences="15" value="ù" /> + <ngram occurrences="15" value="êà" /> + <ngram occurrences="15" value="èêè_" /> + <ngram occurrences="15" value="è_ã" /> + <ngram occurrences="15" value="çå" /> + <ngram occurrences="15" value="àã_" /> + <ngram occurrences="15" value="à_à" /> + <ngram occurrences="15" value="_ü" /> + <ngram occurrences="14" value="ñþ" /> + <ngram occurrences="14" value="ëó" /> + <ngram occurrences="14" value="æä" /> + <ngram occurrences="14" value="äðç" /> + <ngram occurrences="14" value="à_ã" /> + <ngram occurrences="14" value="_ú" /> + <ngram occurrences="14" value="_ðí" /> + <ngram occurrences="14" value="_ëä" /> + <ngram occurrences="13" value="ñä" /> + <ngram occurrences="13" value="ñà_" /> + <ngram occurrences="13" value="î" /> + <ngram occurrences="13" value="íë" /> + <ngram occurrences="13" value="ë_" /> + <ngram occurrences="13" value="ê_" /> + <ngram occurrences="13" value="èð" /> + <ngram occurrences="13" value="çè_" /> + <ngram occurrences="13" value="åäê" /> + <ngram occurrences="13" value="âè" /> + <ngram occurrences="13" value="àþ" /> + <ngram occurrences="13" value="àðç" /> + <ngram occurrences="13" value="àêè" /> + <ngram occurrences="13" value="à_ãà" /> + <ngram occurrences="12" value="úþ" /> + <ngram occurrences="12" value="õà" /> + <ngram occurrences="12" value="ôä" /> + <ngram occurrences="12" value="ó_" /> + <ngram occurrences="12" value="òà" /> + <ngram occurrences="12" value="ñè" /> + <ngram occurrences="12" value="íáà" /> + <ngram occurrences="12" value="éà" /> + <ngram occurrences="12" value="è_ãà" /> + <ngram occurrences="12" value="åèñ" /> + <ngram occurrences="12" value="äã" /> + <ngram occurrences="12" value="äáà_" /> + <ngram occurrences="12" value="ãè" /> + <ngram occurrences="12" value="âàì" /> + <ngram occurrences="12" value="àõ" /> + <ngram occurrences="12" value="àñ_" /> + <ngram occurrences="12" value="àð_" /> + <ngram occurrences="12" value="àà" /> + <ngram occurrences="12" value="à_âà" /> + <ngram occurrences="12" value="_í" /> + <ngram occurrences="12" value="_äð" /> + <ngram occurrences="11" value="øà" /> + <ngram occurrences="11" value="ñ_ñ" /> + <ngram occurrences="11" value="ðäá" /> + <ngram occurrences="11" value="ëàð" /> + <ngram occurrences="11" value="èç_" /> + <ngram occurrences="11" value="èã" /> + <ngram occurrences="11" value="è_ñ" /> + <ngram occurrences="11" value="è_ë" /> + <ngram occurrences="11" value="è_è" /> + <ngram occurrences="11" value="çó" /> + <ngram occurrences="11" value="åê" /> + <ngram occurrences="11" value="äì_" /> + <ngram occurrences="11" value="äêè_" /> + <ngram occurrences="11" value="äå" /> + <ngram occurrences="11" value="âí" /> + <ngram occurrences="11" value="áä" /> + <ngram occurrences="11" value="àø" /> + <ngram occurrences="11" value="àðà" /> + <ngram occurrences="11" value="à_ñ" /> + <ngram occurrences="11" value="_ì" /> + <ngram occurrences="11" value="_ëí" /> + <ngram occurrences="11" value="_èñ" /> + <ngram occurrences="11" value="_äðç" /> + <ngram occurrences="11" value="_àð_" /> + <ngram occurrences="10" value="ôè" /> + <ngram occurrences="10" value="óðè" /> + <ngram occurrences="10" value="ñ_ëà" /> + <ngram occurrences="10" value="ðà_" /> + <ngram occurrences="10" value="íê" /> + <ngram occurrences="10" value="ìäá" /> + <ngram occurrences="10" value="êñ_" /> + <ngram occurrences="10" value="êñ" /> + <ngram occurrences="10" value="èõ" /> + <ngram occurrences="10" value="èñà_" /> + <ngram occurrences="10" value="èâ" /> + <ngram occurrences="10" value="è_ð" /> + <ngram occurrences="10" value="çõ" /> + <ngram occurrences="10" value="åàê" /> + <ngram occurrences="10" value="äô" /> + <ngram occurrences="10" value="äìè" /> + <ngram occurrences="10" value="àìè_" /> + <ngram occurrences="10" value="àè" /> + <ngram occurrences="10" value="àæ" /> + <ngram occurrences="10" value="_þà" /> + <ngram occurrences="10" value="_äñ" /> + <ngram occurrences="10" value="_àë" /> + <ngram occurrences="9" value="òè" /> + <ngram occurrences="9" value="òä" /> + <ngram occurrences="9" value="ñ_ç" /> + <ngram occurrences="9" value="ñ_ã" /> + <ngram occurrences="9" value="ðã" /> + <ngram occurrences="9" value="ìãà_" /> + <ngram occurrences="9" value="ìãà" /> + <ngram occurrences="9" value="éè" /> + <ngram occurrences="9" value="èú" /> + <ngram occurrences="9" value="çà_" /> + <ngram occurrences="9" value="åã" /> + <ngram occurrences="9" value="åà_" /> + <ngram occurrences="9" value="äôä" /> + <ngram occurrences="9" value="äç" /> + <ngram occurrences="9" value="âàì_" /> + <ngram occurrences="9" value="âàë" /> + <ngram occurrences="9" value="áó" /> + <ngram occurrences="9" value="áèñ" /> + <ngram occurrences="9" value="àú" /> + <ngram occurrences="9" value="àö" /> + <ngram occurrences="9" value="àò" /> + <ngram occurrences="9" value="àðè" /> + <ngram occurrences="9" value="àëí" /> + <ngram occurrences="9" value="àãà" /> + <ngram occurrences="9" value="àâà" /> + <ngram occurrences="9" value="_ô" /> + <ngram occurrences="9" value="_ñþ" /> + <ngram occurrences="9" value="_âàë" /> + <ngram occurrences="9" value="_àðà" /> + <ngram occurrences="8" value="þàê" /> + <ngram occurrences="8" value="õàðç" /> + <ngram occurrences="8" value="õàð" /> + <ngram occurrences="8" value="òí" /> + <ngram occurrences="8" value="ñþå" /> + <ngram occurrences="8" value="ñàþ" /> + <ngram occurrences="8" value="ñ_þ" /> + <ngram occurrences="8" value="ñ_ø" /> + <ngram occurrences="8" value="ñ_ãà" /> + <ngram occurrences="8" value="ñ_â" /> + <ngram occurrences="8" value="ðú" /> + <ngram occurrences="8" value="ìí" /> + <ngram occurrences="8" value="ëóê" /> + <ngram occurrences="8" value="ëäôä" /> + <ngram occurrences="8" value="ëäô" /> + <ngram occurrences="8" value="ëà_" /> + <ngram occurrences="8" value="êí_" /> + <ngram occurrences="8" value="êèñ_" /> + <ngram occurrences="8" value="êèà" /> + <ngram occurrences="8" value="èñ_ë" /> + <ngram occurrences="8" value="è_ø" /> + <ngram occurrences="8" value="è_ç" /> + <ngram occurrences="8" value="è_ä" /> + <ngram occurrences="8" value="è_ãà_" /> + <ngram occurrences="8" value="çàå" /> + <ngram occurrences="8" value="æä_" /> + <ngram occurrences="8" value="åñ" /> + <ngram occurrences="8" value="äáóê" /> + <ngram occurrences="8" value="äáó" /> + <ngram occurrences="8" value="ãð" /> + <ngram occurrences="8" value="âð" /> + <ngram occurrences="8" value="âè_" /> + <ngram occurrences="8" value="áóê" /> + <ngram occurrences="8" value="àô" /> + <ngram occurrences="8" value="àëè" /> + <ngram occurrences="8" value="àåè" /> + <ngram occurrences="8" value="àåà" /> + <ngram occurrences="8" value="ß" /> + <ngram occurrences="8" value="_øà" /> + <ngram occurrences="8" value="_ò" /> + <ngram occurrences="8" value="_çå" /> + <ngram occurrences="7" value="þí" /> + <ngram occurrences="7" value="þäê" /> + <ngram occurrences="7" value="üä" /> + <ngram occurrences="7" value="óì" /> + <ngram occurrences="7" value="ñò" /> + <ngram occurrences="7" value="ðèñ" /> + <ngram occurrences="7" value="ðçè_" /> + <ngram occurrences="7" value="ðçè" /> + <ngram occurrences="7" value="ðâ" /> + <ngram occurrences="7" value="îè" /> + <ngram occurrences="7" value="íñ_" /> + <ngram occurrences="7" value="íì" /> + <ngram occurrences="7" value="íêí" /> + <ngram occurrences="7" value="íã" /> + <ngram occurrences="7" value="íâ" /> + <ngram occurrences="7" value="íáà_" /> + <ngram occurrences="7" value="ì_ë" /> + <ngram occurrences="7" value="ëèê" /> + <ngram occurrences="7" value="ëàì" /> + <ngram occurrences="7" value="êèà_" /> + <ngram occurrences="7" value="èó" /> + <ngram occurrences="7" value="èìã" /> + <ngram occurrences="7" value="èé" /> + <ngram occurrences="7" value="èå" /> + <ngram occurrences="7" value="è_ü" /> + <ngram occurrences="7" value="è_â" /> + <ngram occurrences="7" value="è_àë" /> + <ngram occurrences="7" value="åèñ_" /> + <ngram occurrences="7" value="åèç" /> + <ngram occurrences="7" value="åäêè" /> + <ngram occurrences="7" value="äðçè_" /> + <ngram occurrences="7" value="äðçè" /> + <ngram occurrences="7" value="äáèñ" /> + <ngram occurrences="7" value="äáè_" /> + <ngram occurrences="7" value="ä_ë" /> + <ngram occurrences="7" value="ãâ" /> + <ngram occurrences="7" value="âàëí" /> + <ngram occurrences="7" value="âàã" /> + <ngram occurrences="7" value="áè_" /> + <ngram occurrences="7" value="àøè" /> + <ngram occurrences="7" value="àëà" /> + <ngram occurrences="7" value="àá" /> + <ngram occurrences="7" value="à_ñà" /> + <ngram occurrences="7" value="à_ëà" /> + <ngram occurrences="7" value="_ù" /> + <ngram occurrences="7" value="_õ" /> + <ngram occurrences="7" value="_ñàþ" /> + <ngram occurrences="7" value="_ðè" /> + <ngram occurrences="7" value="_ëäôä" /> + <ngram occurrences="7" value="_ëäô" /> + <ngram occurrences="7" value="_æ" /> + <ngram occurrences="7" value="_äñ_" /> + <ngram occurrences="7" value="_äðçè" /> + <ngram occurrences="7" value="_âàëí" /> + <ngram occurrences="6" value="þè" /> + <ngram occurrences="6" value="þåà" /> + <ngram occurrences="6" value="üè" /> + <ngram occurrences="6" value="úþä" /> + <ngram occurrences="6" value="ùä" /> + <ngram occurrences="6" value="øàëèê" /> + <ngram occurrences="6" value="øàëè" /> + <ngram occurrences="6" value="øàë" /> + <ngram occurrences="6" value="öå" /> + <ngram occurrences="6" value="õð" /> + <ngram occurrences="6" value="õå" /> + <ngram occurrences="6" value="ôê" /> + <ngram occurrences="6" value="óðè_" /> + <ngram occurrences="6" value="óê_" /> + <ngram occurrences="6" value="òè_" /> + <ngram occurrences="6" value="ñþåà" /> + <ngram occurrences="6" value="ñ_øä" /> + <ngram occurrences="6" value="ñ_à" /> + <ngram occurrences="6" value="ðíë" /> + <ngram occurrences="6" value="ðíá" /> + <ngram occurrences="6" value="ðë" /> + <ngram occurrences="6" value="ðçóê" /> + <ngram occurrences="6" value="ðçó" /> + <ngram occurrences="6" value="ðãà" /> + <ngram occurrences="6" value="ðàå" /> + <ngram occurrences="6" value="ðàã" /> + <ngram occurrences="6" value="íë_" /> + <ngram occurrences="6" value="íå" /> + <ngram occurrences="6" value="íä" /> + <ngram occurrences="6" value="íáè" /> + <ngram occurrences="6" value="ìèê" /> + <ngram occurrences="6" value="ëç" /> + <ngram occurrences="6" value="ëæ" /> + <ngram occurrences="6" value="ëã" /> + <ngram occurrences="6" value="êþ" /> + <ngram occurrences="6" value="êíá" /> + <ngram occurrences="6" value="êèñà" /> + <ngram occurrences="6" value="êäá" /> + <ngram occurrences="6" value="èò" /> + <ngram occurrences="6" value="èçà" /> + <ngram occurrences="6" value="è_ñà" /> +</ngrams> diff --git a/src/plugins/language/german.klp b/src/plugins/language/german.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="695" value="_" /> + <ngram occurrences="658" value="e" /> + <ngram occurrences="392" value="n" /> + <ngram occurrences="323" value="i" /> + <ngram occurrences="318" value="r" /> + <ngram occurrences="265" value="t" /> + <ngram occurrences="249" value="s" /> + <ngram occurrences="216" value="a" /> + <ngram occurrences="203" value="d" /> + <ngram occurrences="197" value="h" /> + <ngram occurrences="172" value="u" /> + <ngram occurrences="148" value="l" /> + <ngram occurrences="146" value="n_" /> + <ngram occurrences="141" value="er" /> + <ngram occurrences="140" value="en" /> + <ngram occurrences="132" value="e_" /> + <ngram occurrences="129" value="c" /> + <ngram occurrences="125" value="o" /> + <ngram occurrences="116" value="g" /> + <ngram occurrences="112" value="ch" /> + <ngram occurrences="110" value="m" /> + <ngram occurrences="105" value="_d" /> + <ngram occurrences="97" value="r_" /> + <ngram occurrences="92" value="en_" /> + <ngram occurrences="83" value="k" /> + <ngram occurrences="80" value="in" /> + <ngram occurrences="79" value="te" /> + <ngram occurrences="79" value="b" /> + <ngram occurrences="78" value="de" /> + <ngram occurrences="74" value="ei" /> + <ngram occurrences="73" value="f" /> + <ngram occurrences="71" value="_s" /> + <ngram occurrences="70" value="er_" /> + <ngram occurrences="67" value="_e" /> + <ngram occurrences="65" value="un" /> + <ngram occurrences="64" value="t_" /> + <ngram occurrences="54" value="ie" /> + <ngram occurrences="53" value="w" /> + <ngram occurrences="53" value="ge" /> + <ngram occurrences="52" value="_a" /> + <ngram occurrences="50" value="s_" /> + <ngram occurrences="49" value="nd" /> + <ngram occurrences="46" value="st" /> + <ngram occurrences="43" value="ng" /> + <ngram occurrences="42" value="z" /> + <ngram occurrences="42" value="der" /> + <ngram occurrences="42" value="_de" /> + <ngram occurrences="41" value="v" /> + <ngram occurrences="40" value="_i" /> + <ngram occurrences="39" value="re" /> + <ngram occurrences="39" value="m_" /> + <ngram occurrences="38" value="sch" /> + <ngram occurrences="38" value="sc" /> + <ngram occurrences="38" value="ne" /> + <ngram occurrences="38" value="di" /> + <ngram occurrences="37" value="he" /> + <ngram occurrences="36" value="d_" /> + <ngram occurrences="36" value="be" /> + <ngram occurrences="35" value="le" /> + <ngram occurrences="35" value="ie_" /> + <ngram occurrences="35" value="au" /> + <ngram occurrences="34" value="es" /> + <ngram occurrences="34" value="der_" /> + <ngram occurrences="33" value="it" /> + <ngram occurrences="33" value="h_" /> + <ngram occurrences="33" value="_w" /> + <ngram occurrences="32" value="ü" /> + <ngram occurrences="32" value="ein" /> + <ngram occurrences="31" value="p" /> + <ngram occurrences="30" value="ä" /> + <ngram occurrences="30" value="ti" /> + <ngram occurrences="30" value="ch_" /> + <ngram occurrences="30" value="_u" /> + <ngram occurrences="29" value="ic" /> + <ngram occurrences="29" value="_di" /> + <ngram occurrences="28" value="_f" /> + <ngram occurrences="28" value="_b" /> + <ngram occurrences="27" value="te_" /> + <ngram occurrences="27" value="nd_" /> + <ngram occurrences="27" value="die" /> + <ngram occurrences="27" value="an" /> + <ngram occurrences="27" value="_k" /> + <ngram occurrences="27" value="_die" /> + <ngram occurrences="27" value="_der" /> + <ngram occurrences="26" value="ung" /> + <ngram occurrences="26" value="si" /> + <ngram occurrences="26" value="or" /> + <ngram occurrences="26" value="nt" /> + <ngram occurrences="26" value="in_" /> + <ngram occurrences="26" value="_v" /> + <ngram occurrences="26" value="_g" /> + <ngram occurrences="26" value="_der_" /> + <ngram occurrences="25" value="is" /> + <ngram occurrences="25" value="ich" /> + <ngram occurrences="25" value="el" /> + <ngram occurrences="25" value="die_" /> + <ngram occurrences="25" value="al" /> + <ngram occurrences="25" value="_un" /> + <ngram occurrences="25" value="_h" /> + <ngram occurrences="25" value="_die_" /> + <ngram occurrences="24" value="_ein" /> + <ngram occurrences="24" value="_ei" /> + <ngram occurrences="23" value="und" /> + <ngram occurrences="23" value="on" /> + <ngram occurrences="23" value="che" /> + <ngram occurrences="22" value="se" /> + <ngram occurrences="22" value="rt" /> + <ngram occurrences="22" value="ra" /> + <ngram occurrences="22" value="me" /> + <ngram occurrences="22" value="li" /> + <ngram occurrences="22" value="at" /> + <ngram occurrences="22" value="_in" /> + <ngram occurrences="21" value="ten" /> + <ngram occurrences="21" value="ht" /> + <ngram occurrences="21" value="em" /> + <ngram occurrences="21" value="_er" /> + <ngram occurrences="20" value="ke" /> + <ngram occurrences="20" value="hr" /> + <ngram occurrences="20" value="_z" /> + <ngram occurrences="20" value="_au" /> + <ngram occurrences="19" value="ur" /> + <ngram occurrences="19" value="n_d" /> + <ngram occurrences="19" value="ll" /> + <ngram occurrences="19" value="da" /> + <ngram occurrences="19" value="_n" /> + <ngram occurrences="18" value="we" /> + <ngram occurrences="18" value="r_d" /> + <ngram occurrences="18" value="ine" /> + <ngram occurrences="18" value="im" /> + <ngram occurrences="18" value="g_" /> + <ngram occurrences="18" value="e_d" /> + <ngram occurrences="18" value="ar" /> + <ngram occurrences="17" value="und_" /> + <ngram occurrences="17" value="ter" /> + <ngram occurrences="17" value="ten_" /> + <ngram occurrences="17" value="ri" /> + <ngram occurrences="17" value="ns" /> + <ngram occurrences="17" value="gen" /> + <ngram occurrences="17" value="eit" /> + <ngram occurrences="17" value="eine" /> + <ngram occurrences="17" value="_da" /> + <ngram occurrences="17" value="_be" /> + <ngram occurrences="16" value="zu" /> + <ngram occurrences="16" value="nge" /> + <ngram occurrences="16" value="e_s" /> + <ngram occurrences="16" value="den" /> + <ngram occurrences="15" value="vo" /> + <ngram occurrences="15" value="ve" /> + <ngram occurrences="15" value="us" /> + <ngram occurrences="15" value="on_" /> + <ngram occurrences="15" value="ig" /> + <ngram occurrences="15" value="ht_" /> + <ngram occurrences="15" value="ha" /> + <ngram occurrences="15" value="fe" /> + <ngram occurrences="15" value="eu" /> + <ngram occurrences="15" value="cht" /> + <ngram occurrences="15" value="ab" /> + <ngram occurrences="15" value="_und_" /> + <ngram occurrences="15" value="_und" /> + <ngram occurrences="15" value="_t" /> + <ngram occurrences="15" value="_si" /> + <ngram occurrences="15" value="_m" /> + <ngram occurrences="15" value="_l" /> + <ngram occurrences="15" value="_in_" /> + <ngram occurrences="15" value="_ge" /> + <ngram occurrences="14" value="ö" /> + <ngram occurrences="14" value="rs" /> + <ngram occurrences="14" value="o_" /> + <ngram occurrences="14" value="n_de" /> + <ngram occurrences="14" value="mm" /> + <ngram occurrences="14" value="et" /> + <ngram occurrences="14" value="ach" /> + <ngram occurrences="14" value="ac" /> + <ngram occurrences="14" value="_sch" /> + <ngram occurrences="14" value="_sc" /> + <ngram occurrences="13" value="ür" /> + <ngram occurrences="13" value="ß" /> + <ngram occurrences="13" value="ze" /> + <ngram occurrences="13" value="wi" /> + <ngram occurrences="13" value="ver" /> + <ngram occurrences="13" value="ru" /> + <ngram occurrences="13" value="r_s" /> + <ngram occurrences="13" value="ng_" /> + <ngram occurrences="13" value="nde" /> + <ngram occurrences="13" value="n_s" /> + <ngram occurrences="13" value="men" /> + <ngram occurrences="13" value="ls" /> + <ngram occurrences="13" value="la" /> + <ngram occurrences="13" value="l_" /> + <ngram occurrences="13" value="he_" /> + <ngram occurrences="13" value="es_" /> + <ngram occurrences="13" value="ent" /> + <ngram occurrences="13" value="em_" /> + <ngram occurrences="13" value="eh" /> + <ngram occurrences="13" value="e_a" /> + <ngram occurrences="13" value="den_" /> + <ngram occurrences="13" value="_zu" /> + <ngram occurrences="13" value="_r" /> + <ngram occurrences="13" value="_eine" /> + <ngram occurrences="12" value="tr" /> + <ngram occurrences="12" value="ste" /> + <ngram occurrences="12" value="rn" /> + <ngram occurrences="12" value="na" /> + <ngram occurrences="12" value="n_w" /> + <ngram occurrences="12" value="lle" /> + <ngram occurrences="12" value="lic" /> + <ngram occurrences="12" value="ko" /> + <ngram occurrences="12" value="it_" /> + <ngram occurrences="12" value="ge_" /> + <ngram occurrences="12" value="fü" /> + <ngram occurrences="12" value="ers" /> + <ngram occurrences="12" value="as" /> + <ngram occurrences="12" value="am" /> + <ngram occurrences="12" value="_vo" /> + <ngram occurrences="12" value="_o" /> + <ngram occurrences="11" value="ür_" /> + <ngram occurrences="11" value="um" /> + <ngram occurrences="11" value="uf" /> + <ngram occurrences="11" value="tt" /> + <ngram occurrences="11" value="ta" /> + <ngram occurrences="11" value="so" /> + <ngram occurrences="11" value="rte" /> + <ngram occurrences="11" value="rk" /> + <ngram occurrences="11" value="ren" /> + <ngram occurrences="11" value="nte" /> + <ngram occurrences="11" value="no" /> + <ngram occurrences="11" value="nn" /> + <ngram occurrences="11" value="ni" /> + <ngram occurrences="11" value="lich" /> + <ngram occurrences="11" value="k_" /> + <ngram occurrences="11" value="hl" /> + <ngram occurrences="11" value="für_" /> + <ngram occurrences="11" value="für" /> + <ngram occurrences="11" value="ck" /> + <ngram occurrences="11" value="che_" /> + <ngram occurrences="11" value="auf" /> + <ngram occurrences="11" value="_ver" /> + <ngram occurrences="11" value="_ve" /> + <ngram occurrences="11" value="_ha" /> + <ngram occurrences="11" value="_für_" /> + <ngram occurrences="11" value="_für" /> + <ngram occurrences="11" value="_fü" /> + <ngram occurrences="10" value="ut" /> + <ngram occurrences="10" value="ung_" /> + <ngram occurrences="10" value="ts" /> + <ngram occurrences="10" value="sp" /> + <ngram occurrences="10" value="sin" /> + <ngram occurrences="10" value="s_e" /> + <ngram occurrences="10" value="rd" /> + <ngram occurrences="10" value="rc" /> + <ngram occurrences="10" value="n_u" /> + <ngram occurrences="10" value="n_der" /> + <ngram occurrences="10" value="n_a" /> + <ngram occurrences="10" value="ma" /> + <ngram occurrences="10" value="ls_" /> + <ngram occurrences="10" value="isch" /> + <ngram occurrences="10" value="isc" /> + <ngram occurrences="10" value="hi" /> + <ngram occurrences="10" value="gs" /> + <ngram occurrences="10" value="en_s" /> + <ngram occurrences="10" value="d_d" /> + <ngram occurrences="10" value="bei" /> + <ngram occurrences="10" value="als" /> + <ngram occurrences="10" value="_st" /> + <ngram occurrences="10" value="_se" /> + <ngram occurrences="9" value="ungs" /> + <ngram occurrences="9" value="um_" /> + <ngram occurrences="9" value="u_" /> + <ngram occurrences="9" value="t_e" /> + <ngram occurrences="9" value="sa" /> + <ngram occurrences="9" value="ren_" /> + <ngram occurrences="9" value="rch" /> + <ngram occurrences="9" value="r_e" /> + <ngram occurrences="9" value="om" /> + <ngram occurrences="9" value="ngs" /> + <ngram occurrences="9" value="nen" /> + <ngram occurrences="9" value="ne_" /> + <ngram occurrences="9" value="nder" /> + <ngram occurrences="9" value="n_e" /> + <ngram occurrences="9" value="mi" /> + <ngram occurrences="9" value="lt" /> + <ngram occurrences="9" value="le_" /> + <ngram occurrences="9" value="ind" /> + <ngram occurrences="9" value="in_d" /> + <ngram occurrences="9" value="im_" /> + <ngram occurrences="9" value="il" /> + <ngram occurrences="9" value="ik" /> + <ngram occurrences="9" value="ich_" /> + <ngram occurrences="9" value="hre" /> + <ngram occurrences="9" value="hen" /> + <ngram occurrences="9" value="gen_" /> + <ngram occurrences="9" value="ere" /> + <ngram occurrences="9" value="er_e" /> + <ngram occurrences="9" value="er_d" /> + <ngram occurrences="9" value="ein_" /> + <ngram occurrences="9" value="e_g" /> + <ngram occurrences="9" value="e_e" /> + <ngram occurrences="9" value="e_de" /> + <ngram occurrences="9" value="das" /> + <ngram occurrences="9" value="cht_" /> + <ngram occurrences="9" value="ba" /> + <ngram occurrences="9" value="als_" /> + <ngram occurrences="9" value="_wi" /> + <ngram occurrences="9" value="_we" /> + <ngram occurrences="9" value="_le" /> + <ngram occurrences="9" value="_ko" /> + <ngram occurrences="9" value="_in_d" /> + <ngram occurrences="9" value="_das" /> + <ngram occurrences="9" value="_al" /> + <ngram occurrences="8" value="wo" /> + <ngram occurrences="8" value="ute_" /> + <ngram occurrences="8" value="ute" /> + <ngram occurrences="8" value="urc" /> + <ngram occurrences="8" value="uc" /> + <ngram occurrences="8" value="tra" /> + <ngram occurrences="8" value="tig" /> + <ngram occurrences="8" value="th" /> + <ngram occurrences="8" value="ter_" /> + <ngram occurrences="8" value="sti" /> + <ngram occurrences="8" value="sich" /> + <ngram occurrences="8" value="sic" /> + <ngram occurrences="8" value="run" /> + <ngram occurrences="8" value="rei" /> + <ngram occurrences="8" value="ol" /> + <ngram occurrences="8" value="ner" /> + <ngram occurrences="8" value="nen_" /> + <ngram occurrences="8" value="nd_d" /> + <ngram occurrences="8" value="n_g" /> + <ngram occurrences="8" value="mme" /> + <ngram occurrences="8" value="leu" /> + <ngram occurrences="8" value="kei" /> + <ngram occurrences="8" value="j" /> + <ngram occurrences="8" value="ir" /> + <ngram occurrences="8" value="in_de" /> + <ngram occurrences="8" value="hen_" /> + <ngram occurrences="8" value="ft" /> + <ngram occurrences="8" value="f_" /> + <ngram occurrences="8" value="erk" /> + <ngram occurrences="8" value="eit_" /> + <ngram occurrences="8" value="du" /> + <ngram occurrences="8" value="do" /> + <ngram occurrences="8" value="das_" /> + <ngram occurrences="8" value="chen_" /> + <ngram occurrences="8" value="chen" /> + <ngram occurrences="8" value="ber" /> + <ngram occurrences="8" value="aus" /> + <ngram occurrences="8" value="as_" /> + <ngram occurrences="8" value="ad" /> + <ngram occurrences="8" value="_re" /> + <ngram occurrences="8" value="_p" /> + <ngram occurrences="8" value="_j" /> + <ngram occurrences="8" value="_das_" /> + <ngram occurrences="8" value="_auf" /> + <ngram occurrences="7" value="ß_" /> + <ngram occurrences="7" value="zu_" /> + <ngram occurrences="7" value="y" /> + <ngram occurrences="7" value="vor" /> + <ngram occurrences="7" value="von_" /> + <ngram occurrences="7" value="von" /> + <ngram occurrences="7" value="us_" /> + <ngram occurrences="7" value="urch" /> + <ngram occurrences="7" value="unge" /> + <ngram occurrences="7" value="uch" /> + <ngram occurrences="7" value="tte" /> + <ngram occurrences="7" value="to" /> + <ngram occurrences="7" value="t_h" /> + <ngram occurrences="7" value="t_d" /> + <ngram occurrences="7" value="rü" /> + <ngram occurrences="7" value="rt_" /> + <ngram occurrences="7" value="rde" /> + <ngram occurrences="7" value="r_die" /> + <ngram occurrences="7" value="r_di" /> + <ngram occurrences="7" value="r_a" /> + <ngram occurrences="7" value="od" /> + <ngram occurrences="7" value="n_un" /> + <ngram occurrences="7" value="n_k" /> + <ngram occurrences="7" value="n_i" /> + <ngram occurrences="7" value="n_b" /> + <ngram occurrences="7" value="men_" /> + <ngram occurrences="7" value="len" /> + <ngram occurrences="7" value="keit" /> + <ngram occurrences="7" value="ka" /> + <ngram occurrences="7" value="io" /> + <ngram occurrences="7" value="ing" /> + <ngram occurrences="7" value="ih" /> + <ngram occurrences="7" value="icht" /> + <ngram occurrences="7" value="hu" /> + <ngram occurrences="7" value="ho" /> + <ngram occurrences="7" value="hat" /> + <ngram occurrences="7" value="h_d" /> + <ngram occurrences="7" value="gr" /> + <ngram occurrences="7" value="ges" /> + <ngram occurrences="7" value="eute_" /> + <ngram occurrences="7" value="eute" /> + <ngram occurrences="7" value="eut" /> + <ngram occurrences="7" value="ert" /> + <ngram occurrences="7" value="er_s" /> + <ngram occurrences="7" value="ens" /> + <ngram occurrences="7" value="end" /> + <ngram occurrences="7" value="en_w" /> +</ngrams> diff --git a/src/plugins/language/greek.klp b/src/plugins/language/greek.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="854" value="_" /> + <ngram occurrences="366" value="á" /> + <ngram occurrences="298" value="ô" /> + <ngram occurrences="290" value="ï" /> + <ngram occurrences="258" value="å" /> + <ngram occurrences="244" value="í" /> + <ngram occurrences="236" value="é" /> + <ngram occurrences="193" value="ü" /> + <ngram occurrences="170" value="ð" /> + <ngram occurrences="162" value="ê" /> + <ngram occurrences="157" value="õ" /> + <ngram occurrences="153" value="ì" /> + <ngram occurrences="141" value="ó" /> + <ngram occurrences="132" value="ñ" /> + <ngram occurrences="128" value="ý" /> + <ngram occurrences="124" value="_ô" /> + <ngram occurrences="118" value="ç" /> + <ngram occurrences="116" value="ë" /> + <ngram occurrences="115" value="á_" /> + <ngram occurrences="97" value="ò_" /> + <ngram occurrences="97" value="ò" /> + <ngram occurrences="96" value="_ê" /> + <ngram occurrences="95" value="ïõ" /> + <ngram occurrences="91" value="í_" /> + <ngram occurrences="88" value="é_" /> + <ngram occurrences="85" value="ï_" /> + <ngram occurrences="82" value="ß" /> + <ngram occurrences="78" value="ôï" /> + <ngram occurrences="77" value="å_" /> + <ngram occurrences="76" value="_á" /> + <ngram occurrences="75" value="õ_" /> + <ngram occurrences="73" value="_ì" /> + <ngram occurrences="69" value="þ" /> + <ngram occurrences="62" value="_ó" /> + <ngram occurrences="61" value="_ð" /> + <ngram occurrences="60" value="ü_" /> + <ngram occurrences="60" value="ä" /> + <ngram occurrences="60" value="_ôï" /> + <ngram occurrences="59" value="ïõ_" /> + <ngram occurrences="59" value="ã" /> + <ngram occurrences="54" value="êá" /> + <ngram occurrences="54" value="_å" /> + <ngram occurrences="52" value="ù" /> + <ngram occurrences="52" value="ç_" /> + <ngram occurrences="49" value="íá" /> + <ngram occurrences="49" value="áí" /> + <ngram occurrences="45" value="_êá" /> + <ngram occurrences="44" value="ôç" /> + <ngram occurrences="40" value="óô" /> + <ngram occurrences="39" value="ôïõ" /> + <ngram occurrences="38" value="ôá" /> + <ngram occurrences="38" value="ðï" /> + <ngram occurrences="37" value="_ôïõ" /> + <ngram occurrences="36" value="_ý" /> + <ngram occurrences="35" value="åé" /> + <ngram occurrences="35" value="áé" /> + <ngram occurrences="34" value="ö" /> + <ngram occurrences="34" value="êü" /> + <ngram occurrences="34" value="_ä" /> + <ngram occurrences="33" value="ðü" /> + <ngram occurrences="33" value="áé_" /> + <ngram occurrences="32" value="è" /> + <ngram occurrences="31" value="ôé" /> + <ngram occurrences="31" value="ìð" /> + <ngram occurrences="31" value="â" /> + <ngram occurrences="31" value="_ï" /> + <ngram occurrences="30" value="íá_" /> + <ngram occurrences="29" value="ôïõ_" /> + <ngram occurrences="29" value="ìå" /> + <ngram occurrences="29" value="åß" /> + <ngram occurrences="29" value="_ôïõ_" /> + <ngram occurrences="28" value="ôü" /> + <ngram occurrences="28" value="ôï_" /> + <ngram occurrences="28" value="éï" /> + <ngram occurrences="28" value="áð" /> + <ngram occurrences="28" value="áí_" /> + <ngram occurrences="27" value="ýí" /> + <ngram occurrences="27" value="_ôç" /> + <ngram occurrences="27" value="_óô" /> + <ngram occurrences="25" value="ý_" /> + <ngram occurrences="25" value="_ã" /> + <ngram occurrences="24" value="üì" /> + <ngram occurrences="24" value="ðå" /> + <ngram occurrences="24" value="ïí" /> + <ngram occurrences="24" value="çí" /> + <ngram occurrences="23" value="î" /> + <ngram occurrences="23" value="íô" /> + <ngram occurrences="23" value="éá" /> + <ngram occurrences="23" value="çí_" /> + <ngram occurrences="23" value="æ" /> + <ngram occurrences="23" value="_í" /> + <ngram occurrences="22" value="þ_" /> + <ngram occurrences="22" value="óå" /> + <ngram occurrences="22" value="ñá" /> + <ngram occurrences="22" value="êáé_" /> + <ngram occurrences="22" value="êáé" /> + <ngram occurrences="22" value="_êü" /> + <ngram occurrences="22" value="_êáé_" /> + <ngram occurrences="22" value="_êáé" /> + <ngram occurrences="22" value="_áð" /> + <ngram occurrences="21" value="ü_ô" /> + <ngram occurrences="21" value="ìï" /> + <ngram occurrences="21" value="áò_" /> + <ngram occurrences="21" value="áò" /> + <ngram occurrences="21" value="áë" /> + <ngram occurrences="21" value="_ï_" /> + <ngram occurrences="21" value="_åß" /> + <ngram occurrences="20" value="ôå" /> + <ngram occurrences="20" value="ñü" /> + <ngram occurrences="19" value="üí" /> + <ngram occurrences="19" value="ù_" /> + <ngram occurrences="19" value="ôçí_" /> + <ngram occurrences="19" value="ôçí" /> + <ngram occurrences="19" value="ðé" /> + <ngram occurrences="19" value="íå" /> + <ngram occurrences="19" value="ìá" /> + <ngram occurrences="19" value="éê" /> + <ngram occurrences="19" value="ßí" /> + <ngram occurrences="19" value="_ôï_" /> + <ngram occurrences="18" value="ýñ" /> + <ngram occurrences="18" value="åñ" /> + <ngram occurrences="18" value="á_ô" /> + <ngram occurrences="18" value="_ü" /> + <ngram occurrences="18" value="_ðï" /> + <ngram occurrences="17" value="ñé" /> + <ngram occurrences="17" value="ðïõ" /> + <ngram occurrences="17" value="ìý" /> + <ngram occurrences="17" value="ëï" /> + <ngram occurrences="17" value="éá_" /> + <ngram occurrences="17" value="åé_" /> + <ngram occurrences="17" value="äå" /> + <ngram occurrences="17" value="_ë" /> + <ngram occurrences="16" value="üë" /> + <ngram occurrences="16" value="óå_" /> + <ngram occurrences="16" value="óá" /> + <ngram occurrences="16" value="ðïõ_" /> + <ngram occurrences="16" value="ìå_" /> + <ngram occurrences="16" value="ëé" /> + <ngram occurrences="16" value="éü" /> + <ngram occurrences="16" value="åí" /> + <ngram occurrences="16" value="áô" /> + <ngram occurrences="16" value="áðü" /> + <ngram occurrences="16" value="ß_" /> + <ngram occurrences="16" value="_ç" /> + <ngram occurrences="15" value="ôá_" /> + <ngram occurrences="15" value="ò_ô" /> + <ngram occurrences="15" value="ðß" /> + <ngram occurrences="15" value="ïý" /> + <ngram occurrences="15" value="ïé" /> + <ngram occurrences="15" value="ï_ð" /> + <ngram occurrences="15" value="íï" /> + <ngram occurrences="15" value="ëü" /> + <ngram occurrences="15" value="é_ô" /> + <ngram occurrences="15" value="çó" /> + <ngram occurrences="15" value="åô" /> + <ngram occurrences="15" value="á_ì" /> + <ngram occurrences="15" value="_ðïõ_" /> + <ngram occurrences="15" value="_ðïõ" /> + <ngram occurrences="15" value="_ç_" /> + <ngram occurrences="15" value="_áðü" /> + <ngram occurrences="14" value="ýíá" /> + <ngram occurrences="14" value="üô" /> + <ngram occurrences="14" value="ôü_" /> + <ngram occurrences="14" value="ðü_" /> + <ngram occurrences="14" value="ïí_" /> + <ngram occurrences="14" value="ï_ê" /> + <ngram occurrences="14" value="ëá" /> + <ngram occurrences="14" value="åí_" /> + <ngram occurrences="14" value="áñ" /> + <ngram occurrences="14" value="áðü_" /> + <ngram occurrences="14" value="á_ê" /> + <ngram occurrences="14" value="_íá" /> + <ngram occurrences="14" value="_ìð" /> + <ngram occurrences="14" value="_ìå" /> + <ngram occurrences="14" value="_äå" /> + <ngram occurrences="14" value="_áðü_" /> + <ngram occurrences="13" value="õô" /> + <ngram occurrences="13" value="ìü" /> + <ngram occurrences="13" value="êï" /> + <ngram occurrences="13" value="éï_" /> + <ngram occurrences="13" value="äåí_" /> + <ngram occurrences="13" value="äåí" /> + <ngram occurrences="13" value="_þ" /> + <ngram occurrences="13" value="_ñ" /> + <ngram occurrences="13" value="_íá_" /> + <ngram occurrences="13" value="_ìï" /> + <ngram occurrences="13" value="_äåí_" /> + <ngram occurrences="13" value="_äåí" /> + <ngram occurrences="12" value="üìð" /> + <ngram occurrences="12" value="õò_" /> + <ngram occurrences="12" value="õò" /> + <ngram occurrences="12" value="õí" /> + <ngram occurrences="12" value="õ_ê" /> + <ngram occurrences="12" value="ñá_" /> + <ngram occurrences="12" value="ðéï" /> + <ngram occurrences="12" value="ïõò_" /> + <ngram occurrences="12" value="ïõò" /> + <ngram occurrences="12" value="íç" /> + <ngram occurrences="12" value="í_ô" /> + <ngram occurrences="12" value="í_ê" /> + <ngram occurrences="12" value="ìïõ" /> + <ngram occurrences="12" value="ç_ì" /> + <ngram occurrences="12" value="áõ" /> + <ngram occurrences="12" value="á_ôï" /> + <ngram occurrences="12" value="ßð" /> + <ngram occurrences="12" value="_ôçí_" /> + <ngram occurrences="12" value="_ôçí" /> + <ngram occurrences="12" value="_ðü" /> + <ngram occurrences="12" value="_áí" /> + <ngram occurrences="11" value="óôï" /> + <ngram occurrences="11" value="ñï" /> + <ngram occurrences="11" value="ðå_" /> + <ngram occurrences="11" value="ïõ_ê" /> + <ngram occurrences="11" value="ïò_" /> + <ngram occurrences="11" value="ïò" /> + <ngram occurrences="11" value="îå" /> + <ngram occurrences="11" value="í_á" /> + <ngram occurrences="11" value="ìé" /> + <ngram occurrences="11" value="ëå" /> + <ngram occurrences="11" value="êüì" /> + <ngram occurrences="11" value="êé" /> + <ngram occurrences="11" value="å_á" /> + <ngram occurrences="11" value="áõô" /> + <ngram occurrences="11" value="áó" /> + <ngram occurrences="11" value="á_ó" /> + <ngram occurrences="11" value="_ö" /> + <ngram occurrences="11" value="_î" /> + <ngram occurrences="11" value="_ìé" /> + <ngram occurrences="11" value="_â" /> + <ngram occurrences="11" value="_áõô" /> + <ngram occurrences="11" value="_áõ" /> + <ngram occurrences="10" value="ýó" /> + <ngram occurrences="10" value="ü_ôï" /> + <ngram occurrences="10" value="ôý" /> + <ngram occurrences="10" value="ôõ" /> + <ngram occurrences="10" value="ôç_" /> + <ngram occurrences="10" value="óôç" /> + <ngram occurrences="10" value="ò_ó" /> + <ngram occurrences="10" value="ò_å" /> + <ngram occurrences="10" value="ñå" /> + <ngram occurrences="10" value="ìýí" /> + <ngram occurrences="10" value="êüìð" /> + <ngram occurrences="10" value="êü_" /> + <ngram occurrences="10" value="êñ" /> + <ngram occurrences="10" value="êå" /> + <ngram occurrences="10" value="é_ôï" /> + <ngram occurrences="10" value="åò_" /> + <ngram occurrences="10" value="åò" /> + <ngram occurrences="10" value="åßðå_" /> + <ngram occurrences="10" value="åßðå" /> + <ngram occurrences="10" value="åßð" /> + <ngram occurrences="10" value="å_ô" /> + <ngram occurrences="10" value="äé" /> + <ngram occurrences="10" value="á_êá" /> + <ngram occurrences="10" value="ßðå_" /> + <ngram occurrences="10" value="ßðå" /> + <ngram occurrences="10" value="ßá" /> + <ngram occurrences="10" value="_óôï" /> + <ngram occurrences="10" value="_óôç" /> + <ngram occurrences="10" value="_êüìð" /> + <ngram occurrences="10" value="_êüì" /> + <ngram occurrences="10" value="_åßðå" /> + <ngram occurrences="10" value="_åßð" /> + <ngram occurrences="9" value="þô" /> + <ngram occurrences="9" value="ýíá_" /> + <ngram occurrences="9" value="üò_" /> + <ngram occurrences="9" value="üò" /> + <ngram occurrences="9" value="üñ" /> + <ngram occurrences="9" value="ôõ_" /> + <ngram occurrences="9" value="ôñ" /> + <ngram occurrences="9" value="ôïõò_" /> + <ngram occurrences="9" value="ôïõò" /> + <ngram occurrences="9" value="ôé_" /> + <ngram occurrences="9" value="ôå_" /> + <ngram occurrences="9" value="ôáí_" /> + <ngram occurrences="9" value="ôáí" /> + <ngram occurrences="9" value="óôï_" /> + <ngram occurrences="9" value="óç" /> + <ngram occurrences="9" value="ò_á" /> + <ngram occurrences="9" value="ðñ" /> + <ngram occurrences="9" value="ïé_" /> + <ngram occurrences="9" value="íôõ_" /> + <ngram occurrences="9" value="íôõ" /> + <ngram occurrences="9" value="ìðé" /> + <ngram occurrences="9" value="ëë" /> + <ngram occurrences="9" value="êáô" /> + <ngram occurrences="9" value="êáí" /> + <ngram occurrences="9" value="éü_" /> + <ngram occurrences="9" value="éó" /> + <ngram occurrences="9" value="éò_" /> + <ngram occurrences="9" value="éò" /> + <ngram occurrences="9" value="éêü" /> + <ngram occurrences="9" value="é_ï" /> + <ngram occurrences="9" value="á_ôïõ" /> + <ngram occurrences="9" value="_êáô" /> + <ngram occurrences="9" value="_é" /> + <ngram occurrences="8" value="ýë" /> + <ngram occurrences="8" value="üìðé" /> + <ngram occurrences="8" value="ü_ê" /> + <ngram occurrences="8" value="õì" /> + <ngram occurrences="8" value="õ_á" /> + <ngram occurrences="8" value="ôéê" /> + <ngram occurrences="8" value="ðüí" /> + <ngram occurrences="8" value="ðßíôõ" /> + <ngram occurrences="8" value="ðßíô" /> + <ngram occurrences="8" value="ðßí" /> + <ngram occurrences="8" value="ïë" /> + <ngram occurrences="8" value="ï_ô" /> + <ngram occurrences="8" value="îå_" /> + <ngram occurrences="8" value="í_ì" /> + <ngram occurrences="8" value="ìðßíô" /> + <ngram occurrences="8" value="ìðßí" /> + <ngram occurrences="8" value="ìðß" /> + <ngram occurrences="8" value="ìïõ_" /> + <ngram occurrences="8" value="êüìðé" /> + <ngram occurrences="8" value="éêü_" /> + <ngram occurrences="8" value="é_á" /> + <ngram occurrences="8" value="çô" /> + <ngram occurrences="8" value="åë" /> + <ngram occurrences="8" value="åã" /> + <ngram occurrences="8" value="ãé" /> + <ngram occurrences="8" value="áì" /> + <ngram occurrences="8" value="áê" /> + <ngram occurrences="8" value="áé_ô" /> + <ngram occurrences="8" value="á_å" /> + <ngram occurrences="8" value="ßíôõ_" /> + <ngram occurrences="8" value="ßíôõ" /> + <ngram occurrences="8" value="ßíô" /> + <ngram occurrences="8" value="_ôïõò" /> + <ngram occurrences="8" value="_ôá" /> + <ngram occurrences="8" value="_óôï_" /> + <ngram occurrences="8" value="_ìðßí" /> + <ngram occurrences="8" value="_ìðß" /> + <ngram occurrences="8" value="_ìá" /> + <ngram occurrences="7" value="üìðéï" /> + <ngram occurrences="7" value="ü_ôïõ" /> + <ngram occurrences="7" value="ü_ôç" /> + <ngram occurrences="7" value="ùò_" /> + <ngram occurrences="7" value="ùò" /> + <ngram occurrences="7" value="õôü" /> + <ngram occurrences="7" value="õð" /> + <ngram occurrences="7" value="õ_ý" /> + <ngram occurrences="7" value="õ_êá" /> + <ngram occurrences="7" value="óù" /> + <ngram occurrences="7" value="óôçí_" /> + <ngram occurrences="7" value="óôçí" /> + <ngram occurrences="7" value="óï" /> + <ngram occurrences="7" value="óç_" /> + <ngram occurrences="7" value="óáí_" /> + <ngram occurrences="7" value="óáí" /> + <ngram occurrences="7" value="ò_ê" /> + <ngram occurrences="7" value="ðü_ô" /> + <ngram occurrences="7" value="ðéïí_" /> + <ngram occurrences="7" value="ðéïí" /> + <ngram occurrences="7" value="ïõ_êá" /> + <ngram occurrences="7" value="ïñ" /> + <ngram occurrences="7" value="íù" /> + <ngram occurrences="7" value="íç_" /> + <ngram occurrences="7" value="í_êá" /> + <ngram occurrences="7" value="ìðéïí" /> + <ngram occurrences="7" value="ìðéï" /> + <ngram occurrences="7" value="ìá_" /> + <ngram occurrences="7" value="ëþ" /> + <ngram occurrences="7" value="êáé_ô" /> + <ngram occurrences="7" value="ê_" /> + <ngram occurrences="7" value="éïí_" /> + <ngram occurrences="7" value="éïí" /> + <ngram occurrences="7" value="éí" /> + <ngram occurrences="7" value="éë" /> + <ngram occurrences="7" value="é_ì" /> + <ngram occurrences="7" value="èá" /> + <ngram occurrences="7" value="ç_ìðß" /> + <ngram occurrences="7" value="ç_ìð" /> + <ngram occurrences="7" value="ãá" /> + <ngram occurrences="7" value="âá" /> + <ngram occurrences="7" value="áðü_ô" /> + <ngram occurrences="7" value="á_óô" /> + <ngram occurrences="7" value="_ý_" /> + <ngram occurrences="7" value="_ôç_" /> + <ngram occurrences="7" value="_ôá_" /> + <ngram occurrences="7" value="_óôçí" /> + <ngram occurrences="7" value="_óá" /> + <ngram occurrences="7" value="_ï_ê" /> + <ngram occurrences="7" value="_ìïõ" /> + <ngram occurrences="7" value="_êé" /> + <ngram occurrences="7" value="_è" /> + <ngram occurrences="7" value="_ç_ìð" /> + <ngram occurrences="7" value="_ç_ì" /> + <ngram occurrences="7" value="_ãé" /> + <ngram occurrences="7" value="_áì" /> + <ngram occurrences="6" value="ýì" /> + <ngram occurrences="6" value="üôé" /> + <ngram occurrences="6" value="ü_ó" /> + <ngram occurrences="6" value="õ_ì" /> + <ngram occurrences="6" value="ôþ" /> + <ngram occurrences="6" value="ôïí" /> + <ngram occurrences="6" value="ôéêü_" /> + <ngram occurrences="6" value="ôéêü" /> + <ngram occurrences="6" value="ôçò_" /> + <ngram occurrences="6" value="ôçò" /> +</ngrams> diff --git a/src/plugins/language/hawaian.klp b/src/plugins/language/hawaian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1106" value="_" /> + <ngram occurrences="781" value="a" /> + <ngram occurrences="386" value="a_" /> + <ngram occurrences="357" value="k" /> + <ngram occurrences="345" value="o" /> + <ngram occurrences="340" value="i" /> + <ngram occurrences="277" value="e" /> + <ngram occurrences="232" value="_k" /> + <ngram occurrences="210" value="u" /> + <ngram occurrences="195" value="n" /> + <ngram occurrences="195" value="h" /> + <ngram occurrences="194" value="i_" /> + <ngram occurrences="192" value="l" /> + <ngram occurrences="182" value="e_" /> + <ngram occurrences="163" value="o_" /> + <ngram occurrences="144" value="ka" /> + <ngram occurrences="141" value="m" /> + <ngram occurrences="136" value="_a" /> + <ngram occurrences="127" value="_i" /> + <ngram occurrences="109" value="_ka" /> + <ngram occurrences="97" value="_h" /> + <ngram occurrences="95" value="ô" /> + <ngram occurrences="95" value="ma" /> + <ngram occurrences="95" value="_m" /> + <ngram occurrences="88" value="p" /> + <ngram occurrences="79" value="ua" /> + <ngram occurrences="79" value="na" /> + <ngram occurrences="78" value="_o" /> + <ngram occurrences="77" value="_n" /> + <ngram occurrences="73" value="_i_" /> + <ngram occurrences="68" value="ke" /> + <ngram occurrences="66" value="_a_" /> + <ngram occurrences="64" value="ä" /> + <ngram occurrences="64" value="u_" /> + <ngram occurrences="61" value="ÿ" /> + <ngram occurrences="61" value="ak" /> + <ngram occurrences="61" value="_ma" /> + <ngram occurrences="60" value="_o_" /> + <ngram occurrences="59" value="na_" /> + <ngram occurrences="59" value="ho" /> + <ngram occurrences="59" value="_l" /> + <ngram occurrences="58" value="ai" /> + <ngram occurrences="56" value="ka_" /> + <ngram occurrences="56" value="i_k" /> + <ngram occurrences="55" value="ua_" /> + <ngram occurrences="55" value="o_k" /> + <ngram occurrences="54" value="ke_" /> + <ngram occurrences="53" value="a_h" /> + <ngram occurrences="53" value="_p" /> + <ngram occurrences="52" value="e_k" /> + <ngram occurrences="51" value="an" /> + <ngram occurrences="50" value="ah" /> + <ngram occurrences="48" value="le" /> + <ngram occurrences="46" value="la" /> + <ngram occurrences="46" value="au" /> + <ngram occurrences="46" value="a_m" /> + <ngram occurrences="44" value="lo" /> + <ngram occurrences="44" value="_ô" /> + <ngram occurrences="43" value="ko" /> + <ngram occurrences="43" value="a_i" /> + <ngram occurrences="42" value="_ke" /> + <ngram occurrences="41" value="a_k" /> + <ngram occurrences="40" value="a_a" /> + <ngram occurrences="40" value="_ka_" /> + <ngram occurrences="39" value="no" /> + <ngram occurrences="39" value="ku" /> + <ngram occurrences="39" value="hi" /> + <ngram occurrences="39" value="_i_k" /> + <ngram occurrences="38" value="ia" /> + <ngram occurrences="38" value="ha" /> + <ngram occurrences="38" value="e_a" /> + <ngram occurrences="37" value="ôo" /> + <ngram occurrences="37" value="le_" /> + <ngram occurrences="37" value="ana" /> + <ngram occurrences="36" value="ä_" /> + <ngram occurrences="36" value="ol" /> + <ngram occurrences="36" value="o_ka" /> + <ngram occurrences="36" value="a_o" /> + <ngram occurrences="35" value="pu" /> + <ngram occurrences="35" value="_ke_" /> + <ngram occurrences="34" value="ai_" /> + <ngram occurrences="33" value="la_" /> + <ngram occurrences="33" value="ia_" /> + <ngram occurrences="33" value="he" /> + <ngram occurrences="33" value="_e" /> + <ngram occurrences="31" value="_ko" /> + <ngram occurrences="30" value="ôa" /> + <ngram occurrences="30" value="w" /> + <ngram occurrences="30" value="ana_" /> + <ngram occurrences="30" value="am" /> + <ngram occurrences="30" value="a_o_" /> + <ngram occurrences="30" value="_o_k" /> + <ngram occurrences="29" value="ik" /> + <ngram occurrences="29" value="el" /> + <ngram occurrences="29" value="al" /> + <ngram occurrences="29" value="a_i_" /> + <ngram occurrences="29" value="_ÿ" /> + <ngram occurrences="29" value="_ho" /> + <ngram occurrences="28" value="ne" /> + <ngram occurrences="28" value="ho_" /> + <ngram occurrences="28" value="ahi" /> + <ngram occurrences="28" value="a_a_" /> + <ngram occurrences="27" value="a_n" /> + <ngram occurrences="27" value="_e_" /> + <ngram occurrences="26" value="pua" /> + <ngram occurrences="26" value="au_" /> + <ngram occurrences="26" value="_he" /> + <ngram occurrences="25" value="me" /> + <ngram occurrences="25" value="ki" /> + <ngram occurrences="25" value="kam" /> + <ngram occurrences="25" value="a_ma" /> + <ngram occurrences="24" value="wa" /> + <ngram occurrences="24" value="o_i" /> + <ngram occurrences="24" value="aô" /> + <ngram occurrences="24" value="ama" /> + <ngram occurrences="24" value="_ôo" /> + <ngram occurrences="24" value="_kam" /> + <ngram occurrences="23" value="oh" /> + <ngram occurrences="23" value="in" /> + <ngram occurrences="23" value="i_i" /> + <ngram occurrences="23" value="i_a" /> + <ngram occurrences="23" value="e_ka" /> + <ngram occurrences="23" value="aku" /> + <ngram occurrences="23" value="_u" /> + <ngram occurrences="22" value="on" /> + <ngram occurrences="22" value="kama" /> + <ngram occurrences="22" value="kah" /> + <ngram occurrences="22" value="ele" /> + <ngram occurrences="22" value="a_ka" /> + <ngram occurrences="22" value="_o_ka" /> + <ngram occurrences="22" value="_ia" /> + <ngram occurrences="22" value="_ak" /> + <ngram occurrences="21" value="ôo_" /> + <ngram occurrences="21" value="pa" /> + <ngram occurrences="21" value="mak" /> + <ngram occurrences="21" value="ele_" /> + <ngram occurrences="21" value="ei" /> + <ngram occurrences="21" value="a_p" /> + <ngram occurrences="21" value="_no" /> + <ngram occurrences="21" value="_kama" /> + <ngram occurrences="21" value="_ia_" /> + <ngram occurrences="20" value="ôi" /> + <ngram occurrences="20" value="mai" /> + <ngram occurrences="20" value="ea_" /> + <ngram occurrences="20" value="ea" /> + <ngram occurrences="20" value="_me" /> + <ngram occurrences="20" value="_mai" /> + <ngram occurrences="20" value="_lo" /> + <ngram occurrences="20" value="_ha" /> + <ngram occurrences="19" value="ÿo" /> + <ngram occurrences="19" value="ke_k" /> + <ngram occurrences="19" value="k_" /> + <ngram occurrences="19" value="iki" /> + <ngram occurrences="19" value="i_ka" /> + <ngram occurrences="19" value="_aku" /> + <ngram occurrences="18" value="ul" /> + <ngram occurrences="18" value="oô" /> + <ngram occurrences="18" value="ok" /> + <ngram occurrences="18" value="o_o" /> + <ngram occurrences="18" value="o_a" /> + <ngram occurrences="18" value="ma_" /> + <ngram occurrences="18" value="lä" /> + <ngram occurrences="18" value="hi_" /> + <ngram occurrences="18" value="he_" /> + <ngram occurrences="18" value="e_i" /> + <ngram occurrences="18" value="apu" /> + <ngram occurrences="18" value="ap" /> + <ngram occurrences="18" value="ake" /> + <ngram occurrences="18" value="a_o_k" /> + <ngram occurrences="18" value="_na" /> + <ngram occurrences="18" value="_k_" /> + <ngram occurrences="17" value="ne_" /> + <ngram occurrences="17" value="ki_" /> + <ngram occurrences="17" value="ke_a" /> + <ngram occurrences="17" value="kahi" /> + <ngram occurrences="17" value="iä_" /> + <ngram occurrences="17" value="iä" /> + <ngram occurrences="17" value="i_m" /> + <ngram occurrences="17" value="i_i_" /> + <ngram occurrences="17" value="aka" /> + <ngram occurrences="17" value="a_l" /> + <ngram occurrences="17" value="_ôo_" /> + <ngram occurrences="17" value="_iä_" /> + <ngram occurrences="17" value="_iä" /> + <ngram occurrences="16" value="oa" /> + <ngram occurrences="16" value="o_kam" /> + <ngram occurrences="16" value="iki_" /> + <ngram occurrences="16" value="apua" /> + <ngram occurrences="16" value="_mak" /> + <ngram occurrences="16" value="_kah" /> + <ngram occurrences="16" value="_a_h" /> + <ngram occurrences="15" value="ÿa" /> + <ngram occurrences="15" value="no_" /> + <ngram occurrences="15" value="a_ô" /> + <ngram occurrences="15" value="a_he" /> + <ngram occurrences="15" value="_pu" /> + <ngram occurrences="15" value="_ke_a" /> + <ngram occurrences="14" value="ôa_" /> + <ngram occurrences="14" value="ua_a" /> + <ngram occurrences="14" value="oho" /> + <ngram occurrences="14" value="na_o_" /> + <ngram occurrences="14" value="na_o" /> + <ngram occurrences="14" value="mapua" /> + <ngram occurrences="14" value="mapu" /> + <ngram occurrences="14" value="map" /> + <ngram occurrences="14" value="kamap" /> + <ngram occurrences="14" value="ih" /> + <ngram occurrences="14" value="i_n" /> + <ngram occurrences="14" value="amapu" /> + <ngram occurrences="14" value="amap" /> + <ngram occurrences="14" value="ahi_" /> + <ngram occurrences="14" value="a_me" /> + <ngram occurrences="14" value="a_i_k" /> + <ngram occurrences="14" value="a_ha" /> + <ngram occurrences="14" value="a_e" /> + <ngram occurrences="14" value="_w" /> + <ngram occurrences="14" value="_ne" /> + <ngram occurrences="14" value="_lä" /> + <ngram occurrences="14" value="_ke_k" /> + <ngram occurrences="14" value="_i_ka" /> + <ngram occurrences="13" value="ÿi" /> + <ngram occurrences="13" value="ôi_" /> + <ngram occurrences="13" value="ua_a_" /> + <ngram occurrences="13" value="u_i" /> + <ngram occurrences="13" value="pua_a" /> + <ngram occurrences="13" value="pua_" /> + <ngram occurrences="13" value="ole" /> + <ngram occurrences="13" value="oho_" /> + <ngram occurrences="13" value="o_p" /> + <ngram occurrences="13" value="noho_" /> + <ngram occurrences="13" value="noho" /> + <ngram occurrences="13" value="noh" /> + <ngram occurrences="13" value="make" /> + <ngram occurrences="13" value="lu" /> + <ngram occurrences="13" value="li" /> + <ngram occurrences="13" value="kau" /> + <ngram occurrences="13" value="i_h" /> + <ngram occurrences="13" value="i_a_" /> + <ngram occurrences="13" value="ei_" /> + <ngram occurrences="13" value="aôa" /> + <ngram occurrences="13" value="_ôa" /> + <ngram occurrences="13" value="_wa" /> + <ngram occurrences="13" value="_noho" /> + <ngram occurrences="13" value="_noh" /> + <ngram occurrences="13" value="_kau" /> + <ngram occurrences="13" value="_he_" /> + <ngram occurrences="13" value="_ana_" /> + <ngram occurrences="13" value="_ana" /> + <ngram occurrences="13" value="_an" /> + <ngram occurrences="12" value="oa_" /> + <ngram occurrences="12" value="o_ia_" /> + <ngram occurrences="12" value="o_ia" /> + <ngram occurrences="12" value="nä" /> + <ngram occurrences="12" value="nu" /> + <ngram occurrences="12" value="n_" /> + <ngram occurrences="12" value="me_" /> + <ngram occurrences="12" value="make_" /> + <ngram occurrences="12" value="kua" /> + <ngram occurrences="12" value="ka_m" /> + <ngram occurrences="12" value="il" /> + <ngram occurrences="12" value="iho" /> + <ngram occurrences="12" value="i_ma" /> + <ngram occurrences="12" value="i_ke_" /> + <ngram occurrences="12" value="i_ke" /> + <ngram occurrences="12" value="hu" /> + <ngram occurrences="12" value="hiki" /> + <ngram occurrences="12" value="hik" /> + <ngram occurrences="12" value="h_" /> + <ngram occurrences="12" value="e_n" /> + <ngram occurrences="12" value="apua_" /> + <ngram occurrences="12" value="ake_" /> + <ngram occurrences="12" value="a_ÿ" /> + <ngram occurrences="12" value="a_ho" /> + <ngram occurrences="12" value="_me_" /> + <ngram occurrences="12" value="_ma_" /> + <ngram occurrences="12" value="_ka_m" /> + <ngram occurrences="11" value="äua_" /> + <ngram occurrences="11" value="äua" /> + <ngram occurrences="11" value="äu" /> + <ngram occurrences="11" value="ula" /> + <ngram occurrences="11" value="uaôa" /> + <ngram occurrences="11" value="uaô" /> + <ngram occurrences="11" value="puaôa" /> + <ngram occurrences="11" value="puaô" /> + <ngram occurrences="11" value="ole_" /> + <ngram occurrences="11" value="o_o_" /> + <ngram occurrences="11" value="o_ka_" /> + <ngram occurrences="11" value="nei_" /> + <ngram occurrences="11" value="nei" /> + <ngram occurrences="11" value="na_i" /> + <ngram occurrences="11" value="mau" /> + <ngram occurrences="11" value="lo_" /> + <ngram occurrences="11" value="ko_" /> + <ngram occurrences="11" value="ke_ka" /> + <ngram occurrences="11" value="i_ko" /> + <ngram occurrences="11" value="i_ka_" /> + <ngram occurrences="11" value="ha_" /> + <ngram occurrences="11" value="e_h" /> + <ngram occurrences="11" value="aÿ" /> + <ngram occurrences="11" value="aôa_" /> + <ngram occurrences="11" value="aha" /> + <ngram occurrences="11" value="a_no" /> + <ngram occurrences="11" value="_ÿo" /> + <ngram occurrences="11" value="_n_" /> + <ngram occurrences="11" value="_make" /> + <ngram occurrences="11" value="_kahi" /> + <ngram occurrences="11" value="_e_k" /> + <ngram occurrences="11" value="_ai" /> + <ngram occurrences="11" value="_a_k" /> + <ngram occurrences="10" value="ë" /> + <ngram occurrences="10" value="un" /> + <ngram occurrences="10" value="ua_i" /> + <ngram occurrences="10" value="u_k" /> + <ngram occurrences="10" value="pe" /> + <ngram occurrences="10" value="ona_" /> + <ngram occurrences="10" value="ona" /> + <ngram occurrences="10" value="olo" /> + <ngram occurrences="10" value="nä_" /> + <ngram occurrences="10" value="l_" /> + <ngram occurrences="10" value="kul" /> + <ngram occurrences="10" value="kai" /> + <ngram occurrences="10" value="kahi_" /> + <ngram occurrences="10" value="ino" /> + <ngram occurrences="10" value="hoô" /> + <ngram occurrences="10" value="ho_i" /> + <ngram occurrences="10" value="hiki_" /> + <ngram occurrences="10" value="e_m" /> + <ngram occurrences="10" value="e_ke" /> + <ngram occurrences="10" value="e_a_" /> + <ngram occurrences="10" value="a_ôo" /> + <ngram occurrences="10" value="a_u" /> + <ngram occurrences="10" value="a_ke" /> + <ngram occurrences="10" value="a_he_" /> + <ngram occurrences="10" value="_pua" /> + <ngram occurrences="10" value="_pa" /> + <ngram occurrences="10" value="_l_" /> + <ngram occurrences="10" value="_hoô" /> + <ngram occurrences="10" value="_h_" /> + <ngram occurrences="9" value="ÿo_" /> + <ngram occurrences="9" value="ö" /> + <ngram occurrences="9" value="ôo_k" /> + <ngram occurrences="9" value="ä_k" /> + <ngram occurrences="9" value="wai" /> + <ngram occurrences="9" value="ula_" /> + <ngram occurrences="9" value="uk" /> + <ngram occurrences="9" value="uaôa_" /> + <ngram occurrences="9" value="u_m" /> + <ngram occurrences="9" value="u_i_" /> + <ngram occurrences="9" value="po" /> + <ngram occurrences="9" value="oÿ" /> + <ngram occurrences="9" value="ou" /> + <ngram occurrences="9" value="oe" /> + <ngram occurrences="9" value="o_i_" /> + <ngram occurrences="9" value="ni" /> + <ngram occurrences="9" value="na_h" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="mai_" /> + <ngram occurrences="9" value="loa" /> + <ngram occurrences="9" value="le_a" /> + <ngram occurrences="9" value="kula" /> + <ngram occurrences="9" value="kaua_" /> + <ngram occurrences="9" value="kaua" /> + <ngram occurrences="9" value="i_ô" /> + <ngram occurrences="9" value="i_o" /> + <ngram occurrences="9" value="i_l" /> + <ngram occurrences="9" value="i_i_k" /> + <ngram occurrences="9" value="hel" /> + <ngram occurrences="9" value="e_ma" /> + <ngram occurrences="9" value="e_kau" /> + <ngram occurrences="9" value="e_i_" /> + <ngram occurrences="9" value="aua_" /> + <ngram occurrences="9" value="aua" /> + <ngram occurrences="9" value="ana_o" /> + <ngram occurrences="9" value="akula" /> + <ngram occurrences="9" value="akul" /> + <ngram occurrences="9" value="akua" /> + <ngram occurrences="9" value="a_ôo_" /> + <ngram occurrences="9" value="a_me_" /> + <ngram occurrences="9" value="a_e_" /> + <ngram occurrences="9" value="a_a_h" /> + <ngram occurrences="9" value="_ua_" /> + <ngram occurrences="9" value="_ua" /> + <ngram occurrences="9" value="_pe" /> + <ngram occurrences="9" value="_nei_" /> + <ngram occurrences="9" value="_nei" /> + <ngram occurrences="9" value="_mai_" /> + <ngram occurrences="9" value="_ku" /> + <ngram occurrences="9" value="_kaua" /> + <ngram occurrences="9" value="_i_ko" /> + <ngram occurrences="9" value="_akul" /> + <ngram occurrences="9" value="_a_m" /> + <ngram occurrences="8" value="ÿe" /> + <ngram occurrences="8" value="ü" /> + <ngram occurrences="8" value="ôo_ka" /> + <ngram occurrences="8" value="u_ma" /> + <ngram occurrences="8" value="oôi" /> + <ngram occurrences="8" value="op" /> + <ngram occurrences="8" value="oe_" /> + <ngram occurrences="8" value="o_ke" /> + <ngram occurrences="8" value="o_a_" /> +</ngrams> diff --git a/src/plugins/language/hebrew.klp b/src/plugins/language/hebrew.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="591" value="_" /> + <ngram occurrences="296" value="é" /> + <ngram occurrences="260" value="å" /> + <ngram occurrences="226" value="ä" /> + <ngram occurrences="167" value="ø" /> + <ngram occurrences="155" value="ì" /> + <ngram occurrences="153" value="ú" /> + <ngram occurrences="121" value="á" /> + <ngram occurrences="120" value="ù" /> + <ngram occurrences="119" value="ä_" /> + <ngram occurrences="118" value="î" /> + <ngram occurrences="112" value="à" /> + <ngram occurrences="97" value="ð" /> + <ngram occurrences="96" value="_ú" /> + <ngram occurrences="89" value="ò" /> + <ngram occurrences="79" value="ã" /> + <ngram occurrences="78" value="í" /> + <ngram occurrences="78" value="_í" /> + <ngram occurrences="75" value="_ä" /> + <ngram occurrences="63" value="á_" /> + <ngram occurrences="57" value="ç" /> + <ngram occurrences="56" value="_ì" /> + <ngram occurrences="55" value="úå" /> + <ngram occurrences="54" value="ë" /> + <ngram occurrences="51" value="ô" /> + <ngram occurrences="51" value="íé" /> + <ngram occurrences="51" value="ì_" /> + <ngram occurrences="51" value="_íé" /> + <ngram occurrences="48" value="ñ" /> + <ngram occurrences="48" value="_ø" /> + <ngram occurrences="46" value="î_" /> + <ngram occurrences="46" value="_é" /> + <ngram occurrences="45" value="_úå" /> + <ngram occurrences="40" value="_å" /> + <ngram occurrences="39" value="â" /> + <ngram occurrences="37" value="ò_" /> + <ngram occurrences="37" value="à_" /> + <ngram occurrences="36" value="ù_" /> + <ngram occurrences="35" value="è" /> + <ngram occurrences="34" value="éð" /> + <ngram occurrences="30" value="ö" /> + <ngram occurrences="29" value="ï" /> + <ngram occurrences="29" value="é_" /> + <ngram occurrences="29" value="_ï" /> + <ngram occurrences="28" value="ø_" /> + <ngram occurrences="28" value="ë_" /> + <ngram occurrences="27" value="_ã" /> + <ngram occurrences="26" value="åð" /> + <ngram occurrences="24" value="ìù" /> + <ngram occurrences="24" value="ä_ú" /> + <ngram occurrences="23" value="åø" /> + <ngram occurrences="23" value="åé" /> + <ngram occurrences="22" value="éã" /> + <ngram occurrences="21" value="å_" /> + <ngram occurrences="20" value="ð_" /> + <ngram occurrences="19" value="øå" /> + <ngram occurrences="19" value="éá" /> + <ngram occurrences="19" value="æ" /> + <ngram occurrences="19" value="äì" /> + <ngram occurrences="18" value="ðé" /> + <ngram occurrences="18" value="éø" /> + <ngram occurrences="18" value="åù" /> + <ngram occurrences="18" value="àø" /> + <ngram occurrences="17" value="úé" /> + <ngram occurrences="17" value="úà" /> + <ngram occurrences="17" value="ùé" /> + <ngram occurrences="17" value="øù" /> + <ngram occurrences="17" value="ðå" /> + <ngram occurrences="17" value="îä_" /> + <ngram occurrences="17" value="îä" /> + <ngram occurrences="17" value="åá" /> + <ngram occurrences="16" value="ìù_" /> + <ngram occurrences="16" value="éé" /> + <ngram occurrences="16" value="éä" /> + <ngram occurrences="15" value="ú_" /> + <ngram occurrences="15" value="øä" /> + <ngram occurrences="15" value="éî" /> + <ngram occurrences="15" value="ä_é" /> + <ngram occurrences="15" value="á_ä" /> + <ngram occurrences="15" value="_úé" /> + <ngram occurrences="15" value="_ìù" /> + <ngram occurrences="14" value="ïé" /> + <ngram occurrences="14" value="ìå" /> + <ngram occurrences="14" value="éò" /> + <ngram occurrences="14" value="éì" /> + <ngram occurrences="14" value="åî" /> + <ngram occurrences="14" value="äð" /> + <ngram occurrences="14" value="äé" /> + <ngram occurrences="14" value="ä_ø" /> + <ngram occurrences="14" value="_úà" /> + <ngram occurrences="14" value="_ïé" /> + <ngram occurrences="14" value="_ìù_" /> + <ngram occurrences="14" value="_á" /> + <ngram occurrences="13" value="øé" /> + <ngram occurrences="13" value="ìò" /> + <ngram occurrences="13" value="éù" /> + <ngram occurrences="13" value="åò" /> + <ngram occurrences="13" value="åä" /> + <ngram occurrences="13" value="ä_ä" /> + <ngram occurrences="12" value="ô_" /> + <ngram occurrences="12" value="î_í" /> + <ngram occurrences="12" value="éë" /> + <ngram occurrences="12" value="åç" /> + <ngram occurrences="12" value="ä_í" /> + <ngram occurrences="12" value="ä_ì" /> + <ngram occurrences="11" value="úéð" /> + <ngram occurrences="11" value="úà_" /> + <ngram occurrences="11" value="øà" /> + <ngram occurrences="11" value="ôä" /> + <ngram occurrences="11" value="éè" /> + <ngram occurrences="11" value="ãé" /> + <ngram occurrences="11" value="_úéð" /> + <ngram occurrences="11" value="_ù" /> + <ngram occurrences="11" value="_ìò" /> + <ngram occurrences="11" value="_éð" /> + <ngram occurrences="11" value="_äð" /> + <ngram occurrences="10" value="úåð" /> + <ngram occurrences="10" value="ùà" /> + <ngram occurrences="10" value="øú" /> + <ngram occurrences="10" value="øç" /> + <ngram occurrences="10" value="øä_" /> + <ngram occurrences="10" value="ìò_" /> + <ngram occurrences="10" value="ìà" /> + <ngram occurrences="10" value="éô" /> + <ngram occurrences="10" value="éñ" /> + <ngram occurrences="10" value="éá_" /> + <ngram occurrences="10" value="ç_" /> + <ngram occurrences="10" value="åú" /> + <ngram occurrences="10" value="ä_íé" /> + <ngram occurrences="10" value="ãå" /> + <ngram occurrences="10" value="àä_" /> + <ngram occurrences="10" value="àä" /> + <ngram occurrences="10" value="_øå" /> + <ngram occurrences="10" value="_ò" /> + <ngram occurrences="10" value="_ìò_" /> + <ngram occurrences="10" value="_äì" /> + <ngram occurrences="10" value="_à" /> + <ngram occurrences="9" value="úåø" /> + <ngram occurrences="9" value="ùø" /> + <ngram occurrences="9" value="ùî" /> + <ngram occurrences="9" value="ùå" /> + <ngram occurrences="9" value="ôä_" /> + <ngram occurrences="9" value="òä" /> + <ngram occurrences="9" value="ò_ú" /> + <ngram occurrences="9" value="íò" /> + <ngram occurrences="9" value="ì_í" /> + <ngram occurrences="9" value="ì_ä" /> + <ngram occurrences="9" value="ê" /> + <ngram occurrences="9" value="éö" /> + <ngram occurrences="9" value="éðå" /> + <ngram occurrences="9" value="åë" /> + <ngram occurrences="9" value="äø" /> + <ngram occurrences="9" value="äì_" /> + <ngram occurrences="9" value="ãî" /> + <ngram occurrences="9" value="ãá" /> + <ngram occurrences="9" value="áé" /> + <ngram occurrences="9" value="á_ú" /> + <ngram occurrences="9" value="_íò" /> + <ngram occurrences="9" value="_ê" /> + <ngram occurrences="9" value="_åð" /> + <ngram occurrences="9" value="_äø" /> + <ngram occurrences="9" value="_äé" /> + <ngram occurrences="8" value="úî" /> + <ngram occurrences="8" value="úä" /> + <ngram occurrences="8" value="ùé_" /> + <ngram occurrences="8" value="òá" /> + <ngram occurrences="8" value="ò_úå" /> + <ngram occurrences="8" value="ñå" /> + <ngram occurrences="8" value="ïå" /> + <ngram occurrences="8" value="îå" /> + <ngram occurrences="8" value="î_íé" /> + <ngram occurrences="8" value="íò_" /> + <ngram occurrences="8" value="ìë" /> + <ngram occurrences="8" value="ì_å" /> + <ngram occurrences="8" value="ë_ú" /> + <ngram occurrences="8" value="éâ" /> + <ngram occurrences="8" value="éà" /> + <ngram occurrences="8" value="çà" /> + <ngram occurrences="8" value="åô" /> + <ngram occurrences="8" value="åé_" /> + <ngram occurrences="8" value="åå" /> + <ngram occurrences="8" value="åà" /> + <ngram occurrences="8" value="â_" /> + <ngram occurrences="8" value="áå" /> + <ngram occurrences="8" value="á_í" /> + <ngram occurrences="8" value="àå" /> + <ngram occurrences="8" value="àá" /> + <ngram occurrences="8" value="_úåø" /> + <ngram occurrences="8" value="_úåð" /> + <ngram occurrences="8" value="_úà_" /> + <ngram occurrences="8" value="_ïå" /> + <ngram occurrences="8" value="_íò_" /> + <ngram occurrences="7" value="úåù" /> + <ngram occurrences="7" value="úåé" /> + <ngram occurrences="7" value="ùàø" /> + <ngram occurrences="7" value="øçà" /> + <ngram occurrences="7" value="ö_" /> + <ngram occurrences="7" value="ó" /> + <ngram occurrences="7" value="òô" /> + <ngram occurrences="7" value="òå" /> + <ngram occurrences="7" value="òä_" /> + <ngram occurrences="7" value="ñì" /> + <ngram occurrences="7" value="ðá" /> + <ngram occurrences="7" value="î_ú" /> + <ngram occurrences="7" value="íéø" /> + <ngram occurrences="7" value="íéã" /> + <ngram occurrences="7" value="ìô" /> + <ngram occurrences="7" value="ìé" /> + <ngram occurrences="7" value="ìàø" /> + <ngram occurrences="7" value="ì_ú" /> + <ngram occurrences="7" value="ì_íé" /> + <ngram occurrences="7" value="ë_úå" /> + <ngram occurrences="7" value="éðé" /> + <ngram occurrences="7" value="éë_" /> + <ngram occurrences="7" value="èñ" /> + <ngram occurrences="7" value="è_" /> + <ngram occurrences="7" value="åã" /> + <ngram occurrences="7" value="åâ" /> + <ngram occurrences="7" value="äù" /> + <ngram occurrences="7" value="äá" /> + <ngram occurrences="7" value="ä_úå" /> + <ngram occurrences="7" value="ãò" /> + <ngram occurrences="7" value="áø" /> + <ngram occurrences="7" value="à_ä" /> + <ngram occurrences="7" value="_úåù" /> + <ngram occurrences="7" value="_ó" /> + <ngram occurrences="7" value="_íéø" /> + <ngram occurrences="7" value="_íéã" /> + <ngram occurrences="7" value="_ç" /> + <ngram occurrences="6" value="úù" /> + <ngram occurrences="6" value="úø" /> + <ngram occurrences="6" value="úä_" /> + <ngram occurrences="6" value="ù_é" /> + <ngram occurrences="6" value="øùé" /> + <ngram occurrences="6" value="øì" /> + <ngram occurrences="6" value="øè" /> + <ngram occurrences="6" value="øã" /> + <ngram occurrences="6" value="ø_ì" /> + <ngram occurrences="6" value="öä_" /> + <ngram occurrences="6" value="öä" /> + <ngram occurrences="6" value="ò_í" /> + <ngram occurrences="6" value="ñä" /> + <ngram occurrences="6" value="ðù" /> + <ngram occurrences="6" value="ïéé" /> + <ngram occurrences="6" value="îì" /> + <ngram occurrences="6" value="î_ä" /> + <ngram occurrences="6" value="íéì" /> + <ngram occurrences="6" value="ìàøùé" /> + <ngram occurrences="6" value="ìàøù" /> + <ngram occurrences="6" value="ëå" /> + <ngram occurrences="6" value="éèñì" /> + <ngram occurrences="6" value="éèñ" /> + <ngram occurrences="6" value="éç" /> + <ngram occurrences="6" value="éå" /> + <ngram occurrences="6" value="éãé" /> + <ngram occurrences="6" value="èñì" /> + <ngram occurrences="6" value="çî" /> + <ngram occurrences="6" value="æ_" /> + <ngram occurrences="6" value="åò_" /> + <ngram occurrences="6" value="åæ" /> + <ngram occurrences="6" value="äî" /> + <ngram occurrences="6" value="ä_å" /> + <ngram occurrences="6" value="á_ø" /> + <ngram occurrences="6" value="àù" /> + <ngram occurrences="6" value="àøùé" /> + <ngram occurrences="6" value="àøù" /> + <ngram occurrences="6" value="àì_" /> + <ngram occurrences="6" value="àì" /> + <ngram occurrences="6" value="àá_" /> + <ngram occurrences="6" value="_úø" /> + <ngram occurrences="6" value="_ø_" /> + <ngram occurrences="6" value="_ïéé" /> + <ngram occurrences="6" value="_î" /> + <ngram occurrences="6" value="_íéì" /> + <ngram occurrences="6" value="_ìà" /> + <ngram occurrences="6" value="_éë_" /> + <ngram occurrences="6" value="_éë" /> + <ngram occurrences="6" value="_ä_" /> + <ngram occurrences="5" value="úð" /> + <ngram occurrences="5" value="úåùø" /> + <ngram occurrences="5" value="ùì_" /> + <ngram occurrences="5" value="ùì" /> + <ngram occurrences="5" value="ù_ï" /> + <ngram occurrences="5" value="ù_í" /> + <ngram occurrences="5" value="øúå" /> + <ngram occurrences="5" value="øù_" /> + <ngram occurrences="5" value="øà_" /> + <ngram occurrences="5" value="ø_ú" /> + <ngram occurrences="5" value="öò" /> + <ngram occurrences="5" value="öå" /> + <ngram occurrences="5" value="òî" /> + <ngram occurrences="5" value="òé" /> + <ngram occurrences="5" value="òá_" /> + <ngram occurrences="5" value="ñìô" /> + <ngram occurrences="5" value="ñä_" /> + <ngram occurrences="5" value="ñà" /> + <ngram occurrences="5" value="ðî" /> + <ngram occurrences="5" value="ðéãî" /> + <ngram occurrences="5" value="ðéã" /> + <ngram occurrences="5" value="îî" /> + <ngram occurrences="5" value="îé" /> + <ngram occurrences="5" value="îá_" /> + <ngram occurrences="5" value="îá" /> + <ngram occurrences="5" value="íéð" /> + <ngram occurrences="5" value="íâ_" /> + <ngram occurrences="5" value="íâ" /> + <ngram occurrences="5" value="ëä_" /> + <ngram occurrences="5" value="ëä" /> + <ngram occurrences="5" value="ë_ä" /> + <ngram occurrences="5" value="éú" /> + <ngram occurrences="5" value="éñå" /> + <ngram occurrences="5" value="éèñìô" /> + <ngram occurrences="5" value="éä_" /> + <ngram occurrences="5" value="éãî" /> + <ngram occurrences="5" value="é_ú" /> + <ngram occurrences="5" value="èñìô" /> + <ngram occurrences="5" value="èá" /> + <ngram occurrences="5" value="çî_" /> + <ngram occurrences="5" value="çé" /> + <ngram occurrences="5" value="çå" /> + <ngram occurrences="5" value="åùø" /> + <ngram occurrences="5" value="åö" /> + <ngram occurrences="5" value="åñ" /> + <ngram occurrences="5" value="åðé" /> + <ngram occurrences="5" value="åð_" /> + <ngram occurrences="5" value="åá_" /> + <ngram occurrences="5" value="ä_úà" /> + <ngram occurrences="5" value="ä_øå" /> + <ngram occurrences="5" value="ãò_" /> + <ngram occurrences="5" value="ã_" /> + <ngram occurrences="5" value="âô" /> + <ngram occurrences="5" value="âé" /> + <ngram occurrences="5" value="âä" /> + <ngram occurrences="5" value="áä_" /> + <ngram occurrences="5" value="áä" /> + <ngram occurrences="5" value="á_å" /> + <ngram occurrences="5" value="á_äì" /> + <ngram occurrences="5" value="àø_" /> + <ngram occurrences="5" value="àî" /> + <ngram occurrences="5" value="àé" /> + <ngram occurrences="5" value="à_ú" /> + <ngram occurrences="5" value="à_í" /> + <ngram occurrences="5" value="_úåùø" /> + <ngram occurrences="5" value="_úåé" /> + <ngram occurrences="5" value="_ùà" /> + <ngram occurrences="5" value="_ñ" /> + <ngram occurrences="5" value="_íéð" /> + <ngram occurrences="5" value="_íâ_" /> + <ngram occurrences="5" value="_íâ" /> + <ngram occurrences="5" value="_ìå" /> + <ngram occurrences="5" value="_ìàøù" /> + <ngram occurrences="5" value="_ìàø" /> + <ngram occurrences="5" value="_ì_" /> + <ngram occurrences="5" value="_åú" /> + <ngram occurrences="5" value="_äá" /> + <ngram occurrences="5" value="_ãå" /> + <ngram occurrences="5" value="_áé" /> + <ngram occurrences="4" value="úî_" /> + <ngram occurrences="4" value="úì" /> + <ngram occurrences="4" value="úéðéè" /> + <ngram occurrences="4" value="úéðé" /> + <ngram occurrences="4" value="úåùøä" /> + <ngram occurrences="4" value="úåá" /> + <ngram occurrences="4" value="ùú" /> + <ngram occurrences="4" value="ùøä_" /> + <ngram occurrences="4" value="ùøä" /> + <ngram occurrences="4" value="ùôà" /> + <ngram occurrences="4" value="ùô" /> + <ngram occurrences="4" value="ùîî" /> + <ngram occurrences="4" value="ùéâ" /> + <ngram occurrences="4" value="ùàø_" /> + <ngram occurrences="4" value="ù_ú" /> + <ngram occurrences="4" value="ù_íé" /> + <ngram occurrences="4" value="ù_ìù_" /> + <ngram occurrences="4" value="ù_ìù" /> + <ngram occurrences="4" value="ù_ì" /> + <ngram occurrences="4" value="ù_ä" /> + <ngram occurrences="4" value="øùôà" /> + <ngram occurrences="4" value="øùô" /> + <ngram occurrences="4" value="øùé_" /> + <ngram occurrences="4" value="øö" /> + <ngram occurrences="4" value="øî" /> + <ngram occurrences="4" value="øì_" /> + <ngram occurrences="4" value="ø_í" /> + <ngram occurrences="4" value="ø_å" /> + <ngram occurrences="4" value="õ" /> + <ngram occurrences="4" value="ôø" /> + <ngram occurrences="4" value="ôî" /> + <ngram occurrences="4" value="ôì" /> + <ngram occurrences="4" value="ôä_ú" /> + <ngram occurrences="4" value="ôà" /> + <ngram occurrences="4" value="ò_ø" /> + <ngram occurrences="4" value="ò_íé" /> + <ngram occurrences="4" value="ñî" /> + <ngram occurrences="4" value="ñìôä_" /> + <ngram occurrences="4" value="ñìôä" /> + <ngram occurrences="4" value="ñé" /> + <ngram occurrences="4" value="ñ_" /> + <ngram occurrences="4" value="ðú" /> + <ngram occurrences="4" value="ðéèñì" /> +</ngrams> diff --git a/src/plugins/language/hindi.klp b/src/plugins/language/hindi.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1062" value="_" /> + <ngram occurrences="417" value="æ" /> + <ngram occurrences="366" value="u" /> + <ngram occurrences="259" value="ð" /> + <ngram occurrences="178" value="â" /> + <ngram occurrences="171" value="æ_" /> + <ngram occurrences="169" value="ð_" /> + <ngram occurrences="167" value="ú" /> + <ngram occurrences="162" value="ç" /> + <ngram occurrences="160" value="úu" /> + <ngram occurrences="154" value="u_" /> + <ngram occurrences="150" value="è" /> + <ngram occurrences="144" value="_æ" /> + <ngram occurrences="135" value="ü" /> + <ngram occurrences="134" value="_â" /> + <ngram occurrences="110" value="ù" /> + <ngram occurrences="109" value="è_" /> + <ngram occurrences="109" value="ã" /> + <ngram occurrences="102" value="_ç" /> + <ngram occurrences="89" value="ø" /> + <ngram occurrences="80" value="ì" /> + <ngram occurrences="79" value="¸" /> + <ngram occurrences="76" value="_ð" /> + <ngram occurrences="72" value="úu_" /> + <ngram occurrences="68" value="_ã" /> + <ngram occurrences="65" value="ãu" /> + <ngram occurrences="60" value="ß" /> + <ngram occurrences="60" value="_ü" /> + <ngram occurrences="60" value="_ú" /> + <ngram occurrences="58" value="ü_" /> + <ngram occurrences="56" value="ô" /> + <ngram occurrences="56" value="_úu" /> + <ngram occurrences="55" value="î" /> + <ngram occurrences="54" value="_ð_" /> + <ngram occurrences="53" value="¸_" /> + <ngram occurrences="53" value="_æ_" /> + <ngram occurrences="46" value="õ" /> + <ngram occurrences="45" value="â_" /> + <ngram occurrences="44" value="ù_" /> + <ngram occurrences="43" value="ñ" /> + <ngram occurrences="43" value="é" /> + <ngram occurrences="43" value="æð" /> + <ngram occurrences="43" value="uæ" /> + <ngram occurrences="42" value="á" /> + <ngram occurrences="41" value="ç_" /> + <ngram occurrences="39" value="uè" /> + <ngram occurrences="37" value="æúu" /> + <ngram occurrences="37" value="æú" /> + <ngram occurrences="34" value="_ø" /> + <ngram occurrences="34" value="_õ" /> + <ngram occurrences="33" value="à" /> + <ngram occurrences="33" value="_ù" /> + <ngram occurrences="33" value="_ì" /> + <ngram occurrences="33" value="_â_" /> + <ngram occurrences="31" value="ô_" /> + <ngram occurrences="31" value="ð¸" /> + <ngram occurrences="31" value="ì_" /> + <ngram occurrences="30" value="_è" /> + <ngram occurrences="30" value="_ãu" /> + <ngram occurrences="29" value="ð_â" /> + <ngram occurrences="29" value="ãñ" /> + <ngram occurrences="29" value="_ãñ" /> + <ngram occurrences="28" value="ñu" /> + <ngram occurrences="28" value="uè_" /> + <ngram occurrences="28" value="_ç_" /> + <ngram occurrences="27" value="øæ" /> + <ngram occurrences="27" value="ð¸_" /> + <ngram occurrences="27" value="ãñu" /> + <ngram occurrences="27" value="u_æ" /> + <ngram occurrences="27" value="_ãñu" /> + <ngram occurrences="26" value="ø_" /> + <ngram occurrences="26" value="ð_ç" /> + <ngram occurrences="26" value="æü" /> + <ngram occurrences="26" value="å" /> + <ngram occurrences="25" value="úuæ" /> + <ngram occurrences="25" value="ö" /> + <ngram occurrences="25" value="_u" /> + <ngram occurrences="24" value="àæ" /> + <ngram occurrences="24" value="_é" /> + <ngram occurrences="23" value="ï" /> + <ngram occurrences="23" value="âæ" /> + <ngram occurrences="23" value="_î" /> + <ngram occurrences="23" value="_è_" /> + <ngram occurrences="22" value="æ_ã" /> + <ngram occurrences="22" value="ãu_" /> + <ngram occurrences="22" value="_ß" /> + <ngram occurrences="21" value="ùð_" /> + <ngram occurrences="21" value="ùð" /> + <ngram occurrences="21" value="ê" /> + <ngram occurrences="21" value="æù" /> + <ngram occurrences="21" value="uæ_" /> + <ngram occurrences="21" value="_ö" /> + <ngram occurrences="21" value="_æð" /> + <ngram occurrences="20" value="ý" /> + <ngram occurrences="20" value="í" /> + <ngram occurrences="20" value="é_" /> + <ngram occurrences="20" value="ææ" /> + <ngram occurrences="20" value="âð" /> + <ngram occurrences="20" value="¹" /> + <ngram occurrences="20" value="uð_" /> + <ngram occurrences="20" value="uð" /> + <ngram occurrences="20" value="u_ç" /> + <ngram occurrences="20" value="_ô" /> + <ngram occurrences="20" value="_æúu" /> + <ngram occurrences="20" value="_æú" /> + <ngram occurrences="19" value="¸u" /> + <ngram occurrences="19" value="è_â" /> + <ngram occurrences="19" value="æ_æ" /> + <ngram occurrences="19" value="s" /> + <ngram occurrences="19" value="_ü_" /> + <ngram occurrences="18" value="üð" /> + <ngram occurrences="18" value="ìæ" /> + <ngram occurrences="18" value="æð_" /> + <ngram occurrences="18" value="_úu_" /> + <ngram occurrences="18" value="_ð¸" /> + <ngram occurrences="18" value="_á" /> + <ngram occurrences="17" value="üæ" /> + <ngram occurrences="17" value="øæ_" /> + <ngram occurrences="17" value="ô¸" /> + <ngram occurrences="17" value="ð_æ" /> + <ngram occurrences="17" value="ßæ" /> + <ngram occurrences="17" value="uô" /> + <ngram occurrences="17" value="u_â" /> + <ngram occurrences="17" value="_ð¸_" /> + <ngram occurrences="16" value="ô¸_" /> + <ngram occurrences="16" value="ñuð_" /> + <ngram occurrences="16" value="ñuð" /> + <ngram occurrences="16" value="ðu" /> + <ngram occurrences="16" value="çü" /> + <ngram occurrences="16" value="æúu_" /> + <ngram occurrences="16" value="æø" /> + <ngram occurrences="16" value="æ_ç" /> + <ngram occurrences="16" value="æ_ãñu" /> + <ngram occurrences="16" value="æ_ãñ" /> + <ngram occurrences="16" value="ãñuð_" /> + <ngram occurrences="16" value="ãñuð" /> + <ngram occurrences="16" value="ãuè" /> + <ngram occurrences="16" value="âð_" /> + <ngram occurrences="16" value="_ð_ç" /> + <ngram occurrences="16" value="_é_" /> + <ngram occurrences="16" value="_ãñuð" /> + <ngram occurrences="15" value="æ_ü" /> + <ngram occurrences="15" value="_ô_" /> + <ngram occurrences="14" value="úu_æ" /> + <ngram occurrences="14" value="ð_ü" /> + <ngram occurrences="14" value="çß" /> + <ngram occurrences="14" value="æü_" /> + <ngram occurrences="14" value="æù_" /> + <ngram occurrences="14" value="æ_â" /> + <ngram occurrences="14" value="åu" /> + <ngram occurrences="14" value="_üð" /> + <ngram occurrences="14" value="_âð" /> + <ngram occurrences="14" value="_âæ" /> + <ngram occurrences="13" value="õúu" /> + <ngram occurrences="13" value="õú" /> + <ngram occurrences="13" value="î_" /> + <ngram occurrences="13" value="ë" /> + <ngram occurrences="13" value="ç¸" /> + <ngram occurrences="13" value="âè" /> + <ngram occurrences="13" value="_çü" /> + <ngram occurrences="13" value="_à" /> + <ngram occurrences="12" value="üð_" /> + <ngram occurrences="12" value="ü_æ" /> + <ngram occurrences="12" value="öæ" /> + <ngram occurrences="12" value="ìæ_" /> + <ngram occurrences="12" value="çù" /> + <ngram occurrences="12" value="âý" /> + <ngram occurrences="12" value="uù" /> + <ngram occurrences="12" value="_úuæ" /> + <ngram occurrences="12" value="_ù_" /> + <ngram occurrences="12" value="_øæ" /> + <ngram occurrences="12" value="_çß" /> + <ngram occurrences="12" value="_ææ" /> + <ngram occurrences="12" value="_å" /> + <ngram occurrences="12" value="_âð_" /> + <ngram occurrences="11" value="üø" /> + <ngram occurrences="11" value="úuè" /> + <ngram occurrences="11" value="úuæ_" /> + <ngram occurrences="11" value="úu_â" /> + <ngram occurrences="11" value="ùè" /> + <ngram occurrences="11" value="õ_" /> + <ngram occurrences="11" value="ðç" /> + <ngram occurrences="11" value="ðu_" /> + <ngram occurrences="11" value="ð_ã" /> + <ngram occurrences="11" value="è¸" /> + <ngram occurrences="11" value="è_æ" /> + <ngram occurrences="11" value="è_ã" /> + <ngram occurrences="11" value="ç¸u" /> + <ngram occurrences="11" value="ææ_" /> + <ngram occurrences="11" value="âúu_" /> + <ngram occurrences="11" value="âúu" /> + <ngram occurrences="11" value="âú" /> + <ngram occurrences="11" value="áæ" /> + <ngram occurrences="11" value="uâ" /> + <ngram occurrences="11" value="_ì_" /> + <ngram occurrences="11" value="_æð_" /> + <ngram occurrences="11" value="_âý" /> + <ngram occurrences="11" value="_âúu_" /> + <ngram occurrences="11" value="_âúu" /> + <ngram occurrences="11" value="_âú" /> + <ngram occurrences="11" value="_s" /> + <ngram occurrences="10" value="¸_ð" /> + <ngram occurrences="10" value="úuã" /> + <ngram occurrences="10" value="úu_ç" /> + <ngram occurrences="10" value="ùè_" /> + <ngram occurrences="10" value="ùæ" /> + <ngram occurrences="10" value="õúu_" /> + <ngram occurrences="10" value="ñu_" /> + <ngram occurrences="10" value="ð_çü" /> + <ngram occurrences="10" value="æì" /> + <ngram occurrences="10" value="æç" /> + <ngram occurrences="10" value="æ_úu" /> + <ngram occurrences="10" value="æ_ú" /> + <ngram occurrences="10" value="æ_ð_" /> + <ngram occurrences="10" value="æ_ð" /> + <ngram occurrences="10" value="ãñu_" /> + <ngram occurrences="10" value="ãuæ" /> + <ngram occurrences="10" value="âù" /> + <ngram occurrences="10" value="âæ_" /> + <ngram occurrences="10" value="ß_" /> + <ngram occurrences="10" value="uì" /> + <ngram occurrences="10" value="uã" /> + <ngram occurrences="10" value="u_ð" /> + <ngram occurrences="10" value="u_æ_" /> + <ngram occurrences="10" value="_üæ" /> + <ngram occurrences="10" value="_ø_" /> + <ngram occurrences="10" value="_çù" /> + <ngram occurrences="10" value="_ãñu_" /> + <ngram occurrences="9" value="¸u_" /> + <ngram occurrences="9" value="úuù" /> + <ngram occurrences="9" value="úuè_" /> + <ngram occurrences="9" value="ù_æ" /> + <ngram occurrences="9" value="ð_ð" /> + <ngram occurrences="9" value="ìè" /> + <ngram occurrences="9" value="è¸_" /> + <ngram occurrences="9" value="è_ú" /> + <ngram occurrences="9" value="è_õ" /> + <ngram occurrences="9" value="çú" /> + <ngram occurrences="9" value="çî" /> + <ngram occurrences="9" value="çu" /> + <ngram occurrences="9" value="æð¸_" /> + <ngram occurrences="9" value="æð¸" /> + <ngram occurrences="9" value="æá" /> + <ngram occurrences="9" value="æ_ø" /> + <ngram occurrences="9" value="âê" /> + <ngram occurrences="9" value="á_" /> + <ngram occurrences="9" value="uè¸" /> + <ngram occurrences="9" value="u_ç_" /> + <ngram occurrences="9" value="u_ã" /> + <ngram occurrences="9" value="_øæ_" /> + <ngram occurrences="9" value="_öæ" /> + <ngram occurrences="9" value="_ð_çü" /> + <ngram occurrences="9" value="_æúu_" /> + <ngram occurrences="9" value="_âù" /> + <ngram occurrences="9" value="_âè" /> + <ngram occurrences="9" value="_áæ" /> + <ngram occurrences="8" value="¸_ð_" /> + <ngram occurrences="8" value="ÿæ" /> + <ngram occurrences="8" value="ÿ" /> + <ngram occurrences="8" value="üæ_" /> + <ngram occurrences="8" value="úu_æ_" /> + <ngram occurrences="8" value="ùæ_" /> + <ngram occurrences="8" value="õæ" /> + <ngram occurrences="8" value="ð_ú" /> + <ngram occurrences="8" value="ð_õ" /> + <ngram occurrences="8" value="ð_ãu" /> + <ngram occurrences="8" value="îð" /> + <ngram occurrences="8" value="îè" /> + <ngram occurrences="8" value="îæ" /> + <ngram occurrences="8" value="è_úu" /> + <ngram occurrences="8" value="çúu" /> + <ngram occurrences="8" value="æè_" /> + <ngram occurrences="8" value="æè" /> + <ngram occurrences="8" value="æ_ç_" /> + <ngram occurrences="8" value="ãuô" /> + <ngram occurrences="8" value="ãuè¸" /> + <ngram occurrences="8" value="ãuè_" /> + <ngram occurrences="8" value="uõ" /> + <ngram occurrences="8" value="u_î" /> + <ngram occurrences="8" value="_üð_" /> + <ngram occurrences="8" value="_úuù" /> + <ngram occurrences="8" value="_õ_" /> + <ngram occurrences="8" value="_ð_â" /> + <ngram occurrences="8" value="_í" /> + <ngram occurrences="8" value="_æ_ü" /> + <ngram occurrences="8" value="_ãuô" /> + <ngram occurrences="8" value="_u_" /> + <ngram occurrences="7" value="¸_æ" /> + <ngram occurrences="7" value="üè" /> + <ngram occurrences="7" value="ü_ð" /> + <ngram occurrences="7" value="úuì" /> + <ngram occurrences="7" value="ùãuè¸" /> + <ngram occurrences="7" value="ùãuè" /> + <ngram occurrences="7" value="ùãu" /> + <ngram occurrences="7" value="ùã" /> + <ngram occurrences="7" value="ù_ç" /> + <ngram occurrences="7" value="ù_â" /> + <ngram occurrences="7" value="øð" /> + <ngram occurrences="7" value="öè_" /> + <ngram occurrences="7" value="öè" /> + <ngram occurrences="7" value="ô_â" /> + <ngram occurrences="7" value="ð_úu" /> + <ngram occurrences="7" value="ïæ" /> + <ngram occurrences="7" value="íæ" /> + <ngram occurrences="7" value="ìæ_ãñ" /> + <ngram occurrences="7" value="ìæ_ã" /> + <ngram occurrences="7" value="è_ð" /> + <ngram occurrences="7" value="çü_" /> + <ngram occurrences="7" value="çù_" /> + <ngram occurrences="7" value="ç_ø" /> + <ngram occurrences="7" value="æ_æ_" /> + <ngram occurrences="7" value="ãuè¸_" /> + <ngram occurrences="7" value="ãuæ_" /> + <ngram occurrences="7" value="âè_" /> + <ngram occurrences="7" value="â_ð_" /> + <ngram occurrences="7" value="â_ð" /> + <ngram occurrences="7" value="â_æ" /> + <ngram occurrences="7" value="áæ_" /> + <ngram occurrences="7" value="àæ_" /> + <ngram occurrences="7" value="¹_" /> + <ngram occurrences="7" value="uùð_" /> + <ngram occurrences="7" value="uùð" /> + <ngram occurrences="7" value="uô¸" /> + <ngram occurrences="7" value="uô_" /> + <ngram occurrences="7" value="uè¸_" /> + <ngram occurrences="7" value="u_è" /> + <ngram occurrences="7" value="_úuã" /> + <ngram occurrences="7" value="_ùð_" /> + <ngram occurrences="7" value="_ùð" /> + <ngram occurrences="7" value="_ùãuè" /> + <ngram occurrences="7" value="_ùãu" /> + <ngram occurrences="7" value="_ùã" /> + <ngram occurrences="7" value="_öè_" /> + <ngram occurrences="7" value="_öè" /> + <ngram occurrences="7" value="_õúu_" /> + <ngram occurrences="7" value="_õúu" /> + <ngram occurrences="7" value="_õú" /> + <ngram occurrences="7" value="_õæ" /> + <ngram occurrences="7" value="_çü_" /> + <ngram occurrences="7" value="_æü" /> + <ngram occurrences="7" value="_æø" /> + <ngram occurrences="7" value="_æ_æ" /> + <ngram occurrences="7" value="_åu" /> + <ngram occurrences="7" value="_ãuæ" /> + <ngram occurrences="7" value="_âê" /> + <ngram occurrences="7" value="_àæ" /> + <ngram occurrences="7" value="_ßæ" /> + <ngram occurrences="6" value="üðç_ù" /> + <ngram occurrences="6" value="üðç_" /> + <ngram occurrences="6" value="üðç" /> + <ngram occurrences="6" value="úuùð_" /> + <ngram occurrences="6" value="úuùð" /> + <ngram occurrences="6" value="úuô" /> + <ngram occurrences="6" value="úuãu" /> + <ngram occurrences="6" value="øð_" /> + <ngram occurrences="6" value="øãu" /> + <ngram occurrences="6" value="øã" /> + <ngram occurrences="6" value="ø_æ" /> + <ngram occurrences="6" value="ñuð_â" /> + <ngram occurrences="6" value="ðç_ù_" /> + <ngram occurrences="6" value="ðç_ù" /> + <ngram occurrences="6" value="ðç_" /> + <ngram occurrences="6" value="ð_ö" /> + <ngram occurrences="6" value="ð_ð_" /> + <ngram occurrences="6" value="ð_çü_" /> + <ngram occurrences="6" value="ð_çß" /> + <ngram occurrences="6" value="ð_æ_" /> + <ngram occurrences="6" value="ð_â_" /> + <ngram occurrences="6" value="îè_" /> + <ngram occurrences="6" value="êú" /> + <ngram occurrences="6" value="éu" /> + <ngram occurrences="6" value="èð_" /> + <ngram occurrences="6" value="èð" /> + <ngram occurrences="6" value="è_ç" /> + <ngram occurrences="6" value="è_æ_" /> + <ngram occurrences="6" value="çüø" /> + <ngram occurrences="6" value="ç_ù_" /> + <ngram occurrences="6" value="ç_ù" /> + <ngram occurrences="6" value="ç_ì" /> + <ngram occurrences="6" value="æúuæ" /> + <ngram occurrences="6" value="æì_" /> + <ngram occurrences="6" value="æã" /> + <ngram occurrences="6" value="æâ" /> + <ngram occurrences="6" value="æ_ô" /> + <ngram occurrences="6" value="æ_ì" /> + <ngram occurrences="6" value="æ_é" /> + <ngram occurrences="6" value="æ_á" /> + <ngram occurrences="6" value="åuè_" /> + <ngram occurrences="6" value="åuè" /> + <ngram occurrences="6" value="ãð" /> + <ngram occurrences="6" value="ãuô_" /> + <ngram occurrences="6" value="âü" /> + <ngram occurrences="6" value="âùè_" /> + <ngram occurrences="6" value="âùè" /> + <ngram occurrences="6" value="âç" /> + <ngram occurrences="6" value="â_ì" /> + <ngram occurrences="6" value="àu" /> + <ngram occurrences="6" value="ßãu" /> + <ngram occurrences="6" value="ßã" /> + <ngram occurrences="6" value="uúu" /> +</ngrams> diff --git a/src/plugins/language/hungarian.klp b/src/plugins/language/hungarian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="581" value="_" /> + <ngram occurrences="339" value="e" /> + <ngram occurrences="301" value="a" /> + <ngram occurrences="263" value="t" /> + <ngram occurrences="211" value="s" /> + <ngram occurrences="209" value="k" /> + <ngram occurrences="191" value="l" /> + <ngram occurrences="179" value="n" /> + <ngram occurrences="158" value="r" /> + <ngram occurrences="146" value="z" /> + <ngram occurrences="145" value="i" /> + <ngram occurrences="136" value="é" /> + <ngram occurrences="127" value="o" /> + <ngram occurrences="126" value="g" /> + <ngram occurrences="115" value="á" /> + <ngram occurrences="102" value="m" /> + <ngram occurrences="93" value="_a" /> + <ngram occurrences="90" value="a_" /> + <ngram occurrences="84" value="t_" /> + <ngram occurrences="80" value="y" /> + <ngram occurrences="77" value="b" /> + <ngram occurrences="73" value="d" /> + <ngram occurrences="72" value="v" /> + <ngram occurrences="70" value="k_" /> + <ngram occurrences="61" value="sz" /> + <ngram occurrences="57" value="_m" /> + <ngram occurrences="57" value="_a_" /> + <ngram occurrences="54" value="gy" /> + <ngram occurrences="50" value="h" /> + <ngram occurrences="48" value="ö" /> + <ngram occurrences="47" value="et" /> + <ngram occurrences="46" value="s_" /> + <ngram occurrences="45" value="_k" /> + <ngram occurrences="44" value="p" /> + <ngram occurrences="44" value="_e" /> + <ngram occurrences="42" value="ó" /> + <ngram occurrences="42" value="u" /> + <ngram occurrences="41" value="e_" /> + <ngram occurrences="40" value="_s" /> + <ngram occurrences="39" value="i_" /> + <ngram occurrences="39" value="en" /> + <ngram occurrences="38" value="eg" /> + <ngram occurrences="37" value="n_" /> + <ngram occurrences="34" value="le" /> + <ngram occurrences="34" value="el" /> + <ngram occurrences="33" value="_h" /> + <ngram occurrences="32" value="j" /> + <ngram occurrences="30" value="te" /> + <ngram occurrences="30" value="f" /> + <ngram occurrences="30" value="ek" /> + <ngram occurrences="30" value="ak" /> + <ngram occurrences="30" value="_sz" /> + <ngram occurrences="29" value="l_" /> + <ngram occurrences="29" value="al" /> + <ngram occurrences="29" value="_é" /> + <ngram occurrences="28" value="õ" /> + <ngram occurrences="28" value="ár" /> + <ngram occurrences="28" value="y_" /> + <ngram occurrences="28" value="_t" /> + <ngram occurrences="27" value="és" /> + <ngram occurrences="27" value="z_" /> + <ngram occurrences="27" value="ke" /> + <ngram occurrences="27" value="er" /> + <ngram occurrences="27" value="az" /> + <ngram occurrences="26" value="ta" /> + <ngram occurrences="26" value="es" /> + <ngram occurrences="26" value="_v" /> + <ngram occurrences="26" value="_i" /> + <ngram occurrences="25" value="tt" /> + <ngram occurrences="25" value="re" /> + <ngram occurrences="25" value="_n" /> + <ngram occurrences="24" value="í" /> + <ngram occurrences="23" value="ze" /> + <ngram occurrences="23" value="té" /> + <ngram occurrences="23" value="or" /> + <ngram occurrences="22" value="gy_" /> + <ngram occurrences="22" value="_b" /> + <ngram occurrences="22" value="_az" /> + <ngram occurrences="21" value="ne" /> + <ngram occurrences="21" value="me" /> + <ngram occurrences="21" value="ag" /> + <ngram occurrences="20" value="zt" /> + <ngram occurrences="20" value="ny" /> + <ngram occurrences="20" value="ko" /> + <ngram occurrences="20" value="ki" /> + <ngram occurrences="20" value="az_" /> + <ngram occurrences="20" value="_f" /> + <ngram occurrences="19" value="ér" /> + <ngram occurrences="19" value="ve" /> + <ngram occurrences="19" value="va" /> + <ngram occurrences="19" value="na" /> + <ngram occurrences="19" value="ll" /> + <ngram occurrences="19" value="at" /> + <ngram occurrences="19" value="an" /> + <ngram occurrences="19" value="_az_" /> + <ngram occurrences="18" value="én" /> + <ngram occurrences="18" value="tá" /> + <ngram occurrences="18" value="is" /> + <ngram occurrences="18" value="egy" /> + <ngram occurrences="18" value="ak_" /> + <ngram occurrences="17" value="ás" /> + <ngram occurrences="17" value="tt_" /> + <ngram occurrences="17" value="r_" /> + <ngram occurrences="17" value="ol" /> + <ngram occurrences="17" value="mi" /> + <ngram occurrences="17" value="g_" /> + <ngram occurrences="17" value="et_" /> + <ngram occurrences="17" value="ek_" /> + <ngram occurrences="16" value="ü" /> + <ngram occurrences="16" value="ít" /> + <ngram occurrences="16" value="ég" /> + <ngram occurrences="16" value="os" /> + <ngram occurrences="16" value="nk" /> + <ngram occurrences="16" value="c" /> + <ngram occurrences="15" value="zá" /> + <ngram occurrences="15" value="ye" /> + <ngram occurrences="15" value="ra" /> + <ngram occurrences="15" value="on" /> + <ngram occurrences="15" value="la" /> + <ngram occurrences="15" value="ho" /> + <ngram occurrences="15" value="be" /> + <ngram occurrences="15" value="agy" /> + <ngram occurrences="15" value="_ki" /> + <ngram occurrences="15" value="_eg" /> + <ngram occurrences="14" value="ú" /> + <ngram occurrences="14" value="ép" /> + <ngram occurrences="14" value="sze" /> + <ngram occurrences="14" value="se" /> + <ngram occurrences="14" value="rt" /> + <ngram occurrences="14" value="ma" /> + <ngram occurrences="14" value="en_" /> + <ngram occurrences="14" value="em" /> + <ngram occurrences="14" value="_me" /> + <ngram occurrences="14" value="_egy" /> + <ngram occurrences="13" value="és_" /> + <ngram occurrences="13" value="ál" /> + <ngram occurrences="13" value="za" /> + <ngram occurrences="13" value="to" /> + <ngram occurrences="13" value="t_a" /> + <ngram occurrences="13" value="sé" /> + <ngram occurrences="13" value="ok" /> + <ngram occurrences="13" value="kö" /> + <ngram occurrences="13" value="ik" /> + <ngram occurrences="13" value="_va" /> + <ngram occurrences="13" value="_l" /> + <ngram occurrences="12" value="án" /> + <ngram occurrences="12" value="sa" /> + <ngram occurrences="12" value="ro" /> + <ngram occurrences="12" value="k_m" /> + <ngram occurrences="12" value="k_a" /> + <ngram occurrences="12" value="it" /> + <ngram occurrences="12" value="ha" /> + <ngram occurrences="12" value="ge" /> + <ngram occurrences="12" value="ez" /> + <ngram occurrences="12" value="ar" /> + <ngram occurrences="12" value="_és_" /> + <ngram occurrences="12" value="_és" /> + <ngram occurrences="12" value="_is" /> + <ngram occurrences="11" value="ét" /> + <ngram occurrences="11" value="szá" /> + <ngram occurrences="11" value="nd" /> + <ngram occurrences="11" value="ett" /> + <ngram occurrences="11" value="da" /> + <ngram occurrences="11" value="cs" /> + <ngram occurrences="11" value="bb" /> + <ngram occurrences="11" value="ba" /> + <ngram occurrences="11" value="_mi" /> + <ngram occurrences="11" value="_ho" /> + <ngram occurrences="10" value="õ_" /> + <ngram occurrences="10" value="ô" /> + <ngram occurrences="10" value="ól" /> + <ngram occurrences="10" value="ás_" /> + <ngram occurrences="10" value="zer" /> + <ngram occurrences="10" value="t_a_" /> + <ngram occurrences="10" value="rs" /> + <ngram occurrences="10" value="oz" /> + <ngram occurrences="10" value="og" /> + <ngram occurrences="10" value="mé" /> + <ngram occurrences="10" value="má" /> + <ngram occurrences="10" value="mo" /> + <ngram occurrences="10" value="meg" /> + <ngram occurrences="10" value="kor" /> + <ngram occurrences="10" value="iz" /> + <ngram occurrences="10" value="in" /> + <ngram occurrences="10" value="de" /> + <ngram occurrences="10" value="ap" /> + <ngram occurrences="10" value="an_" /> + <ngram occurrences="10" value="a_m" /> + <ngram occurrences="10" value="a_h" /> + <ngram occurrences="10" value="_meg" /> + <ngram occurrences="10" value="_ke" /> + <ngram occurrences="10" value="_ha" /> + <ngram occurrences="10" value="_d" /> + <ngram occurrences="9" value="ól_" /> + <ngram occurrences="9" value="ág" /> + <ngram occurrences="9" value="zé" /> + <ngram occurrences="9" value="vé" /> + <ngram occurrences="9" value="ut" /> + <ngram occurrences="9" value="ul" /> + <ngram occurrences="9" value="szer" /> + <ngram occurrences="9" value="st" /> + <ngram occurrences="9" value="so" /> + <ngram occurrences="9" value="re_" /> + <ngram occurrences="9" value="pe" /> + <ngram occurrences="9" value="né" /> + <ngram occurrences="9" value="nt" /> + <ngram occurrences="9" value="n_a" /> + <ngram occurrences="9" value="lá" /> + <ngram occurrences="9" value="lt" /> + <ngram occurrences="9" value="li" /> + <ngram occurrences="9" value="ka" /> + <ngram occurrences="9" value="is_" /> + <ngram occurrences="9" value="ik_" /> + <ngram occurrences="9" value="egy_" /> + <ngram occurrences="9" value="as" /> + <ngram occurrences="9" value="ai" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="a_a" /> + <ngram occurrences="9" value="_r" /> + <ngram occurrences="9" value="_ma" /> + <ngram occurrences="9" value="_j" /> + <ngram occurrences="9" value="_g" /> + <ngram occurrences="9" value="_a_m" /> + <ngram occurrences="8" value="öv" /> + <ngram occurrences="8" value="ó_" /> + <ngram occurrences="8" value="ény" /> + <ngram occurrences="8" value="ék" /> + <ngram occurrences="8" value="ár_" /> + <ngram occurrences="8" value="áll" /> + <ngram occurrences="8" value="zi" /> + <ngram occurrences="8" value="tö" /> + <ngram occurrences="8" value="t_e" /> + <ngram occurrences="8" value="sít" /> + <ngram occurrences="8" value="sí" /> + <ngram occurrences="8" value="ség" /> + <ngram occurrences="8" value="ss" /> + <ngram occurrences="8" value="s_a" /> + <ngram occurrences="8" value="nn" /> + <ngram occurrences="8" value="m_" /> + <ngram occurrences="8" value="ló" /> + <ngram occurrences="8" value="lle" /> + <ngram occurrences="8" value="let" /> + <ngram occurrences="8" value="ká" /> + <ngram occurrences="8" value="kr" /> + <ngram occurrences="8" value="il" /> + <ngram occurrences="8" value="ele" /> + <ngram occurrences="8" value="do" /> + <ngram occurrences="8" value="bi" /> + <ngram occurrences="8" value="ban_" /> + <ngram occurrences="8" value="ban" /> + <ngram occurrences="8" value="ad" /> + <ngram occurrences="8" value="a_v" /> + <ngram occurrences="8" value="_le" /> + <ngram occurrences="8" value="_is_" /> + <ngram occurrences="8" value="_es" /> + <ngram occurrences="8" value="_el" /> + <ngram occurrences="8" value="_egy_" /> + <ngram occurrences="7" value="û" /> + <ngram occurrences="7" value="öt" /> + <ngram occurrences="7" value="ör" /> + <ngram occurrences="7" value="öl" /> + <ngram occurrences="7" value="ók" /> + <ngram occurrences="7" value="év" /> + <ngram occurrences="7" value="ét_" /> + <ngram occurrences="7" value="át" /> + <ngram occurrences="7" value="ák" /> + <ngram occurrences="7" value="áb" /> + <ngram occurrences="7" value="z_a" /> + <ngram occurrences="7" value="ya" /> + <ngram occurrences="7" value="vén" /> + <ngram occurrences="7" value="vá" /> + <ngram occurrences="7" value="vagy" /> + <ngram occurrences="7" value="vag" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="tés" /> + <ngram occurrences="7" value="tet" /> + <ngram occurrences="7" value="szé" /> + <ngram occurrences="7" value="sza" /> + <ngram occurrences="7" value="rá" /> + <ngram occurrences="7" value="ri" /> + <ngram occurrences="7" value="rd" /> + <ngram occurrences="7" value="ot" /> + <ngram occurrences="7" value="nk_" /> + <ngram occurrences="7" value="nak_" /> + <ngram occurrences="7" value="nak" /> + <ngram occurrences="7" value="min" /> + <ngram occurrences="7" value="kár" /> + <ngram occurrences="7" value="ket_" /> + <ngram occurrences="7" value="ket" /> + <ngram occurrences="7" value="k_s" /> + <ngram occurrences="7" value="k_a_" /> + <ngram occurrences="7" value="há" /> + <ngram occurrences="7" value="hog" /> + <ngram occurrences="7" value="gye" /> + <ngram occurrences="7" value="fe" /> + <ngram occurrences="7" value="ett_" /> + <ngram occurrences="7" value="e_a" /> + <ngram occurrences="7" value="bu" /> + <ngram occurrences="7" value="b_" /> + <ngram occurrences="7" value="am" /> + <ngram occurrences="7" value="a_s" /> + <ngram occurrences="7" value="_ér" /> + <ngram occurrences="7" value="_á" /> + <ngram occurrences="7" value="_vagy" /> + <ngram occurrences="7" value="_vag" /> + <ngram occurrences="7" value="_u" /> + <ngram occurrences="7" value="_tö" /> + <ngram occurrences="7" value="_te" /> + <ngram occurrences="7" value="_p" /> + <ngram occurrences="7" value="_né" /> + <ngram occurrences="7" value="_na" /> + <ngram occurrences="7" value="_má" /> + <ngram occurrences="7" value="_mo" /> + <ngram occurrences="7" value="_kö" /> + <ngram occurrences="7" value="_hog" /> + <ngram occurrences="7" value="_be" /> + <ngram occurrences="7" value="_a_h" /> + <ngram occurrences="6" value="ön" /> + <ngram occurrences="6" value="ég_" /> + <ngram occurrences="6" value="zõ" /> + <ngram occurrences="6" value="ztosí" /> + <ngram occurrences="6" value="ztos" /> + <ngram occurrences="6" value="zto" /> + <ngram occurrences="6" value="zs" /> + <ngram occurrences="6" value="zet" /> + <ngram occurrences="6" value="yi" /> + <ngram occurrences="6" value="yek" /> + <ngram occurrences="6" value="y_e" /> + <ngram occurrences="6" value="vagy_" /> + <ngram occurrences="6" value="uda" /> + <ngram occurrences="6" value="tó" /> + <ngram occurrences="6" value="tosít" /> + <ngram occurrences="6" value="tosí" /> + <ngram occurrences="6" value="tos" /> + <ngram occurrences="6" value="te_" /> + <ngram occurrences="6" value="t_é" /> + <ngram occurrences="6" value="t_t" /> + <ngram occurrences="6" value="t_m" /> + <ngram occurrences="6" value="t_k" /> + <ngram occurrences="6" value="t_i" /> + <ngram occurrences="6" value="t_h" /> + <ngram occurrences="6" value="sok" /> + <ngram occurrences="6" value="rz" /> + <ngram occurrences="6" value="rv" /> + <ngram occurrences="6" value="ps" /> + <ngram occurrences="6" value="po" /> + <ngram occurrences="6" value="pa" /> + <ngram occurrences="6" value="osít" /> + <ngram occurrences="6" value="osí" /> + <ngram occurrences="6" value="om" /> + <ngram occurrences="6" value="ogy_" /> + <ngram occurrences="6" value="ogy" /> + <ngram occurrences="6" value="nye" /> + <ngram occurrences="6" value="nt_" /> + <ngram occurrences="6" value="ne_" /> + <ngram occurrences="6" value="ly" /> + <ngram occurrences="6" value="li_" /> + <ngram occurrences="6" value="ké" /> + <ngram occurrences="6" value="ki_" /> + <ngram occurrences="6" value="kb" /> + <ngram occurrences="6" value="k_sz" /> + <ngram occurrences="6" value="k_e" /> + <ngram occurrences="6" value="já" /> + <ngram occurrences="6" value="iztos" /> + <ngram occurrences="6" value="izto" /> + <ngram occurrences="6" value="izt" /> + <ngram occurrences="6" value="id" /> + <ngram occurrences="6" value="i_k" /> + <ngram occurrences="6" value="hogy_" /> + <ngram occurrences="6" value="hogy" /> + <ngram occurrences="6" value="he" /> + <ngram occurrences="6" value="ga" /> + <ngram occurrences="6" value="esz" /> + <ngram occurrences="6" value="ere" /> + <ngram occurrences="6" value="ell" /> + <ngram occurrences="6" value="eh" /> + <ngram occurrences="6" value="e_h" /> + <ngram occurrences="6" value="di" /> + <ngram occurrences="6" value="buda" /> + <ngram occurrences="6" value="bud" /> + <ngram occurrences="6" value="bizto" /> + <ngram occurrences="6" value="bizt" /> + <ngram occurrences="6" value="biz" /> + <ngram occurrences="6" value="ben" /> + <ngram occurrences="6" value="at_" /> + <ngram occurrences="6" value="al_" /> + <ngram occurrences="6" value="ak_a" /> + <ngram occurrences="6" value="ai_" /> + <ngram occurrences="6" value="agy_" /> + <ngram occurrences="6" value="a_ha" /> + <ngram occurrences="6" value="_év" /> + <ngram occurrences="6" value="_ut" /> + <ngram occurrences="6" value="_szé" /> + <ngram occurrences="6" value="_sze" /> + <ngram occurrences="6" value="_re" /> + <ngram occurrences="6" value="_ne" /> + <ngram occurrences="6" value="_mé" /> + <ngram occurrences="6" value="_min" /> + <ngram occurrences="6" value="_hogy" /> + <ngram occurrences="6" value="_gy" /> +</ngrams> diff --git a/src/plugins/language/icelandic.klp b/src/plugins/language/icelandic.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="743" value="_" /> + <ngram occurrences="337" value="a" /> + <ngram occurrences="318" value="r" /> + <ngram occurrences="285" value="n" /> + <ngram occurrences="255" value="i" /> + <ngram occurrences="249" value="u" /> + <ngram occurrences="243" value="e" /> + <ngram occurrences="207" value="s" /> + <ngram occurrences="179" value="t" /> + <ngram occurrences="175" value="ð" /> + <ngram occurrences="167" value="l" /> + <ngram occurrences="165" value="g" /> + <ngram occurrences="152" value="k" /> + <ngram occurrences="140" value="m" /> + <ngram occurrences="135" value="f" /> + <ngram occurrences="118" value="r_" /> + <ngram occurrences="82" value="ð_" /> + <ngram occurrences="81" value="_s" /> + <ngram occurrences="76" value="v" /> + <ngram occurrences="75" value="í" /> + <ngram occurrences="73" value="ar" /> + <ngram occurrences="70" value="o" /> + <ngram occurrences="69" value="m_" /> + <ngram occurrences="66" value="a_" /> + <ngram occurrences="64" value="á" /> + <ngram occurrences="64" value="að" /> + <ngram occurrences="63" value="j" /> + <ngram occurrences="58" value="i_" /> + <ngram occurrences="57" value="_f" /> + <ngram occurrences="56" value="u_" /> + <ngram occurrences="56" value="n_" /> + <ngram occurrences="55" value="æ" /> + <ngram occurrences="55" value="in" /> + <ngram occurrences="55" value="h" /> + <ngram occurrences="54" value="_e" /> + <ngram occurrences="53" value="_a" /> + <ngram occurrences="51" value="b" /> + <ngram occurrences="50" value="_í" /> + <ngram occurrences="49" value="um" /> + <ngram occurrences="48" value="ur" /> + <ngram occurrences="48" value="g_" /> + <ngram occurrences="47" value="d" /> + <ngram occurrences="47" value="að_" /> + <ngram occurrences="45" value="í_" /> + <ngram occurrences="45" value="um_" /> + <ngram occurrences="45" value="_h" /> + <ngram occurrences="44" value="st" /> + <ngram occurrences="44" value="er" /> + <ngram occurrences="44" value="_í_" /> + <ngram occurrences="43" value="þ" /> + <ngram occurrences="43" value="ö" /> + <ngram occurrences="43" value="ó" /> + <ngram occurrences="42" value="nn" /> + <ngram occurrences="42" value="_v" /> + <ngram occurrences="41" value="ei" /> + <ngram occurrences="41" value="_þ" /> + <ngram occurrences="40" value="nu" /> + <ngram occurrences="38" value="ið" /> + <ngram occurrences="37" value="y" /> + <ngram occurrences="37" value="ur_" /> + <ngram occurrences="37" value="_á" /> + <ngram occurrences="37" value="_m" /> + <ngram occurrences="37" value="_að" /> + <ngram occurrences="36" value="á_" /> + <ngram occurrences="36" value="ir" /> + <ngram occurrences="36" value="an" /> + <ngram occurrences="36" value="_o" /> + <ngram occurrences="35" value="ve" /> + <ngram occurrences="35" value="p" /> + <ngram occurrences="34" value="un" /> + <ngram occurrences="34" value="og" /> + <ngram occurrences="34" value="ar_" /> + <ngram occurrences="33" value="og_" /> + <ngram occurrences="33" value="_og_" /> + <ngram occurrences="33" value="_og" /> + <ngram occurrences="32" value="_b" /> + <ngram occurrences="31" value="ta" /> + <ngram occurrences="31" value="_að_" /> + <ngram occurrences="30" value="t_" /> + <ngram occurrences="30" value="na" /> + <ngram occurrences="29" value="ðu" /> + <ngram occurrences="29" value="en" /> + <ngram occurrences="29" value="_g" /> + <ngram occurrences="28" value="ti" /> + <ngram occurrences="28" value="ri" /> + <ngram occurrences="28" value="lu" /> + <ngram occurrences="28" value="la" /> + <ngram occurrences="27" value="ú" /> + <ngram occurrences="27" value="_u" /> + <ngram occurrences="26" value="_á_" /> + <ngram occurrences="26" value="_ve" /> + <ngram occurrences="25" value="ði" /> + <ngram occurrences="24" value="ng" /> + <ngram occurrences="24" value="nd" /> + <ngram occurrences="24" value="ja" /> + <ngram occurrences="23" value="sl" /> + <ngram occurrences="23" value="rð" /> + <ngram occurrences="23" value="ra" /> + <ngram occurrences="23" value="kk" /> + <ngram occurrences="23" value="ki" /> + <ngram occurrences="23" value="ið_" /> + <ngram occurrences="23" value="_t" /> + <ngram occurrences="22" value="ir_" /> + <ngram occurrences="21" value="ef" /> + <ngram occurrences="20" value="tu" /> + <ngram occurrences="20" value="ku" /> + <ngram occurrences="20" value="ga" /> + <ngram occurrences="20" value="em" /> + <ngram occurrences="20" value="_n" /> + <ngram occurrences="20" value="_l" /> + <ngram occurrences="19" value="é" /> + <ngram occurrences="19" value="sk" /> + <ngram occurrences="19" value="se" /> + <ngram occurrences="19" value="re" /> + <ngram occurrences="19" value="inn" /> + <ngram occurrences="19" value="il" /> + <ngram occurrences="19" value="_k" /> + <ngram occurrences="18" value="ða" /> + <ngram occurrences="18" value="ver" /> + <ngram occurrences="18" value="s_" /> + <ngram occurrences="17" value="nn_" /> + <ngram occurrences="17" value="ni" /> + <ngram occurrences="17" value="ek" /> + <ngram occurrences="17" value="af" /> + <ngram occurrences="17" value="_er" /> + <ngram occurrences="16" value="sem" /> + <ngram occurrences="16" value="num_" /> + <ngram occurrences="16" value="num" /> + <ngram occurrences="16" value="mi" /> + <ngram occurrences="16" value="ka" /> + <ngram occurrences="16" value="eg" /> + <ngram occurrences="16" value="_ver" /> + <ngram occurrences="16" value="_se" /> + <ngram occurrences="15" value="ði_" /> + <ngram occurrences="15" value="sem_" /> + <ngram occurrences="15" value="lö" /> + <ngram occurrences="15" value="gu" /> + <ngram occurrences="15" value="gi" /> + <ngram occurrences="15" value="es" /> + <ngram occurrences="15" value="em_" /> + <ngram occurrences="15" value="da" /> + <ngram occurrences="15" value="ag" /> + <ngram occurrences="15" value="_sem_" /> + <ngram occurrences="15" value="_sem" /> + <ngram occurrences="14" value="þe" /> + <ngram occurrences="14" value="ður" /> + <ngram occurrences="14" value="æk" /> + <ngram occurrences="14" value="yr" /> + <ngram occurrences="14" value="rf" /> + <ngram occurrences="14" value="nar" /> + <ngram occurrences="14" value="l_" /> + <ngram occurrences="14" value="jó" /> + <ngram occurrences="14" value="ha" /> + <ngram occurrences="14" value="ge" /> + <ngram occurrences="14" value="bæ" /> + <ngram occurrences="14" value="am" /> + <ngram occurrences="14" value="_þe" /> + <ngram occurrences="13" value="þa" /> + <ngram occurrences="13" value="ög" /> + <ngram occurrences="13" value="vi" /> + <ngram occurrences="13" value="uð" /> + <ngram occurrences="13" value="tt" /> + <ngram occurrences="13" value="ne" /> + <ngram occurrences="13" value="ll" /> + <ngram occurrences="13" value="li" /> + <ngram occurrences="13" value="ki_" /> + <ngram occurrences="13" value="is" /> + <ngram occurrences="13" value="he" /> + <ngram occurrences="13" value="fr" /> + <ngram occurrences="13" value="fl" /> + <ngram occurrences="13" value="al" /> + <ngram occurrences="13" value="_þa" /> + <ngram occurrences="13" value="_ha" /> + <ngram occurrences="12" value="ík" /> + <ngram occurrences="12" value="te" /> + <ngram occurrences="12" value="r_í_" /> + <ngram occurrences="12" value="r_í" /> + <ngram occurrences="12" value="r_s" /> + <ngram occurrences="12" value="r_f" /> + <ngram occurrences="12" value="nar_" /> + <ngram occurrences="12" value="me" /> + <ngram occurrences="12" value="ma" /> + <ngram occurrences="12" value="ko" /> + <ngram occurrences="12" value="k_" /> + <ngram occurrences="12" value="ey" /> + <ngram occurrences="12" value="ekk" /> + <ngram occurrences="12" value="_he" /> + <ngram occurrences="11" value="yrir" /> + <ngram occurrences="11" value="yri" /> + <ngram occurrences="11" value="us" /> + <ngram occurrences="11" value="slu" /> + <ngram occurrences="11" value="ru" /> + <ngram occurrences="11" value="rir" /> + <ngram occurrences="11" value="ju" /> + <ngram occurrences="11" value="inu" /> + <ngram occurrences="11" value="fyrir" /> + <ngram occurrences="11" value="fyri" /> + <ngram occurrences="11" value="fyr" /> + <ngram occurrences="11" value="fy" /> + <ngram occurrences="11" value="erð" /> + <ngram occurrences="11" value="di" /> + <ngram occurrences="11" value="_mi" /> + <ngram occurrences="10" value="ðs" /> + <ngram occurrences="10" value="st_" /> + <ngram occurrences="10" value="si" /> + <ngram occurrences="10" value="sa" /> + <ngram occurrences="10" value="rðu" /> + <ngram occurrences="10" value="rn" /> + <ngram occurrences="10" value="pp" /> + <ngram occurrences="10" value="or" /> + <ngram occurrences="10" value="ns" /> + <ngram occurrences="10" value="le" /> + <ngram occurrences="10" value="kki_" /> + <ngram occurrences="10" value="kki" /> + <ngram occurrences="10" value="kj" /> + <ngram occurrences="10" value="il_" /> + <ngram occurrences="10" value="gr" /> + <ngram occurrences="10" value="fu" /> + <ngram occurrences="10" value="fj" /> + <ngram occurrences="10" value="f_" /> + <ngram occurrences="10" value="et" /> + <ngram occurrences="10" value="ekki_" /> + <ngram occurrences="10" value="ekki" /> + <ngram occurrences="10" value="br" /> + <ngram occurrences="10" value="arf" /> + <ngram occurrences="10" value="_um" /> + <ngram occurrences="10" value="_st" /> + <ngram occurrences="10" value="_ge" /> + <ngram occurrences="10" value="_ekki" /> + <ngram occurrences="10" value="_ekk" /> + <ngram occurrences="10" value="_ek" /> + <ngram occurrences="9" value="ý" /> + <ngram occurrences="9" value="ður_" /> + <ngram occurrences="9" value="ví" /> + <ngram occurrences="9" value="va" /> + <ngram occurrences="9" value="un_" /> + <ngram occurrences="9" value="til_" /> + <ngram occurrences="9" value="til" /> + <ngram occurrences="9" value="ta_" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="ru_" /> + <ngram occurrences="9" value="rs" /> + <ngram occurrences="9" value="r_k" /> + <ngram occurrences="9" value="nu_" /> + <ngram occurrences="9" value="nni" /> + <ngram occurrences="9" value="na_" /> + <ngram occurrences="9" value="lög" /> + <ngram occurrences="9" value="lu_" /> + <ngram occurrences="9" value="kur" /> + <ngram occurrences="9" value="ke" /> + <ngram occurrences="9" value="gn" /> + <ngram occurrences="9" value="fæ" /> + <ngram occurrences="9" value="er_" /> + <ngram occurrences="9" value="du" /> + <ngram occurrences="9" value="av" /> + <ngram occurrences="9" value="ann" /> + <ngram occurrences="9" value="an_" /> + <ngram occurrences="9" value="_um_" /> + <ngram occurrences="9" value="_til_" /> + <ngram occurrences="9" value="_til" /> + <ngram occurrences="9" value="_ti" /> + <ngram occurrences="9" value="_sk" /> + <ngram occurrences="9" value="_r" /> + <ngram occurrences="9" value="_me" /> + <ngram occurrences="9" value="_fyri" /> + <ngram occurrences="9" value="_fyr" /> + <ngram occurrences="9" value="_fy" /> + <ngram occurrences="9" value="_fr" /> + <ngram occurrences="9" value="_er_" /> + <ngram occurrences="9" value="_ei" /> + <ngram occurrences="8" value="út" /> + <ngram occurrences="8" value="ón" /> + <ngram occurrences="8" value="ðu_" /> + <ngram occurrences="8" value="ða_" /> + <ngram occurrences="8" value="ð_í" /> + <ngram occurrences="8" value="í_s" /> + <ngram occurrences="8" value="ær" /> + <ngram occurrences="8" value="uðu" /> + <ngram occurrences="8" value="ut" /> + <ngram occurrences="8" value="upp" /> + <ngram occurrences="8" value="up" /> + <ngram occurrences="8" value="u_e" /> + <ngram occurrences="8" value="tu_" /> + <ngram occurrences="8" value="sé" /> + <ngram occurrences="8" value="stu" /> + <ngram occurrences="8" value="ss" /> + <ngram occurrences="8" value="r_e" /> + <ngram occurrences="8" value="ngi" /> + <ngram occurrences="8" value="nes" /> + <ngram occurrences="8" value="nda" /> + <ngram occurrences="8" value="m_m" /> + <ngram occurrences="8" value="kt" /> + <ngram occurrences="8" value="ja_" /> + <ngram occurrences="8" value="it" /> + <ngram occurrences="8" value="ing" /> + <ngram occurrences="8" value="ik" /> + <ngram occurrences="8" value="hef" /> + <ngram occurrences="8" value="gar" /> + <ngram occurrences="8" value="ga_" /> + <ngram occurrences="8" value="fe" /> + <ngram occurrences="8" value="fa" /> + <ngram occurrences="8" value="eð" /> + <ngram occurrences="8" value="ein" /> + <ngram occurrences="8" value="aði" /> + <ngram occurrences="8" value="a_s" /> + <ngram occurrences="8" value="a_h" /> + <ngram occurrences="8" value="a_f" /> + <ngram occurrences="8" value="_ú" /> + <ngram occurrences="8" value="_í_s" /> + <ngram occurrences="8" value="_vi" /> + <ngram occurrences="8" value="_upp" /> + <ngram occurrences="8" value="_up" /> + <ngram occurrences="8" value="_un" /> + <ngram occurrences="8" value="_sé" /> + <ngram occurrences="8" value="_ke" /> + <ngram occurrences="8" value="_hef" /> + <ngram occurrences="8" value="_en" /> + <ngram occurrences="8" value="_bæ" /> + <ngram occurrences="8" value="_af" /> + <ngram occurrences="7" value="þar" /> + <ngram occurrences="7" value="út_" /> + <ngram occurrences="7" value="ól" /> + <ngram occurrences="7" value="ðar" /> + <ngram occurrences="7" value="ð_u" /> + <ngram occurrences="7" value="æð" /> + <ngram occurrences="7" value="æt" /> + <ngram occurrences="7" value="ækk" /> + <ngram occurrences="7" value="yrir_" /> + <ngram occurrences="7" value="vík" /> + <ngram occurrences="7" value="ust" /> + <ngram occurrences="7" value="und" /> + <ngram occurrences="7" value="t_s" /> + <ngram occurrences="7" value="rður_" /> + <ngram occurrences="7" value="rður" /> + <ngram occurrences="7" value="rt" /> + <ngram occurrences="7" value="rl" /> + <ngram occurrences="7" value="rk" /> + <ngram occurrences="7" value="rið" /> + <ngram occurrences="7" value="rir_" /> + <ngram occurrences="7" value="rey" /> + <ngram occurrences="7" value="ram" /> + <ngram occurrences="7" value="r_h" /> + <ngram occurrences="7" value="r_a" /> + <ngram occurrences="7" value="n_í_" /> + <ngram occurrences="7" value="n_í" /> + <ngram occurrences="7" value="n_e" /> + <ngram occurrences="7" value="lj" /> + <ngram occurrences="7" value="ld" /> + <ngram occurrences="7" value="kun" /> + <ngram occurrences="7" value="jar" /> + <ngram occurrences="7" value="inni" /> + <ngram occurrences="7" value="ig" /> + <ngram occurrences="7" value="gre" /> + <ngram occurrences="7" value="gl" /> + <ngram occurrences="7" value="g_a" /> + <ngram occurrences="7" value="fækk" /> + <ngram occurrences="7" value="fæk" /> + <ngram occurrences="7" value="fn" /> + <ngram occurrences="7" value="fi" /> + <ngram occurrences="7" value="erður" /> + <ngram occurrences="7" value="erðu" /> + <ngram occurrences="7" value="eru_" /> + <ngram occurrences="7" value="eru" /> + <ngram occurrences="7" value="eng" /> + <ngram occurrences="7" value="en_" /> + <ngram occurrences="7" value="el" /> + <ngram occurrences="7" value="eið" /> + <ngram occurrences="7" value="avík" /> + <ngram occurrences="7" value="aví" /> + <ngram occurrences="7" value="as" /> + <ngram occurrences="7" value="a_e" /> + <ngram occurrences="7" value="_þar" /> + <ngram occurrences="7" value="_re" /> + <ngram occurrences="7" value="_fækk" /> + <ngram occurrences="7" value="_fæk" /> + <ngram occurrences="7" value="_fæ" /> + <ngram occurrences="7" value="_fj" /> + <ngram occurrences="7" value="_eru_" /> + <ngram occurrences="7" value="_eru" /> + <ngram occurrences="7" value="_en_" /> + <ngram occurrences="7" value="_br" /> + <ngram occurrences="6" value="þar_" /> + <ngram occurrences="6" value="ön" /> + <ngram occurrences="6" value="öl" /> + <ngram occurrences="6" value="ót" /> + <ngram occurrences="6" value="ð_s" /> + <ngram occurrences="6" value="ð_o" /> + <ngram occurrences="6" value="ð_f" /> + <ngram occurrences="6" value="ð_a" /> + <ngram occurrences="6" value="íkur" /> + <ngram occurrences="6" value="íku" /> + <ngram occurrences="6" value="í_g" /> + <ngram occurrences="6" value="é_" /> + <ngram occurrences="6" value="ær_" /> + <ngram occurrences="6" value="æ_" /> + <ngram occurrences="6" value="ár" /> + <ngram occurrences="6" value="á_v" /> + <ngram occurrences="6" value="ys" /> + <ngram occurrences="6" value="yk" /> + <ngram occurrences="6" value="víkur" /> +</ngrams> diff --git a/src/plugins/language/indonesian.klp b/src/plugins/language/indonesian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="729" value="a" /> + <ngram occurrences="673" value="_" /> + <ngram occurrences="372" value="n" /> + <ngram occurrences="314" value="i" /> + <ngram occurrences="309" value="e" /> + <ngram occurrences="221" value="r" /> + <ngram occurrences="217" value="u" /> + <ngram occurrences="215" value="t" /> + <ngram occurrences="214" value="k" /> + <ngram occurrences="185" value="an" /> + <ngram occurrences="175" value="s" /> + <ngram occurrences="164" value="m" /> + <ngram occurrences="162" value="d" /> + <ngram occurrences="156" value="g" /> + <ngram occurrences="131" value="a_" /> + <ngram occurrences="128" value="p" /> + <ngram occurrences="116" value="l" /> + <ngram occurrences="110" value="n_" /> + <ngram occurrences="108" value="ng" /> + <ngram occurrences="99" value="an_" /> + <ngram occurrences="98" value="i_" /> + <ngram occurrences="96" value="b" /> + <ngram occurrences="93" value="o" /> + <ngram occurrences="87" value="_d" /> + <ngram occurrences="86" value="er" /> + <ngram occurrences="79" value="h" /> + <ngram occurrences="78" value="_m" /> + <ngram occurrences="77" value="ka" /> + <ngram occurrences="70" value="_k" /> + <ngram occurrences="69" value="ar" /> + <ngram occurrences="69" value="_p" /> + <ngram occurrences="66" value="ta" /> + <ngram occurrences="65" value="en" /> + <ngram occurrences="65" value="di" /> + <ngram occurrences="62" value="me" /> + <ngram occurrences="59" value="_s" /> + <ngram occurrences="57" value="y" /> + <ngram occurrences="56" value="ang" /> + <ngram occurrences="56" value="_me" /> + <ngram occurrences="55" value="ra" /> + <ngram occurrences="55" value="at" /> + <ngram occurrences="53" value="j" /> + <ngram occurrences="53" value="ak" /> + <ngram occurrences="51" value="ga" /> + <ngram occurrences="50" value="in" /> + <ngram occurrences="50" value="da" /> + <ngram occurrences="50" value="_t" /> + <ngram occurrences="50" value="_b" /> + <ngram occurrences="49" value="_di" /> + <ngram occurrences="48" value="ng_" /> + <ngram occurrences="48" value="g_" /> + <ngram occurrences="46" value="ya" /> + <ngram occurrences="44" value="k_" /> + <ngram occurrences="42" value="un" /> + <ngram occurrences="42" value="la" /> + <ngram occurrences="42" value="h_" /> + <ngram occurrences="41" value="tu" /> + <ngram occurrences="41" value="ma" /> + <ngram occurrences="40" value="na" /> + <ngram occurrences="38" value="se" /> + <ngram occurrences="37" value="ri" /> + <ngram occurrences="37" value="ke" /> + <ngram occurrences="37" value="_a" /> + <ngram occurrences="36" value="u_" /> + <ngram occurrences="36" value="pe" /> + <ngram occurrences="35" value="ang_" /> + <ngram occurrences="35" value="ah" /> + <ngram occurrences="34" value="be" /> + <ngram occurrences="34" value="_ke" /> + <ngram occurrences="33" value="pa" /> + <ngram occurrences="33" value="_i" /> + <ngram occurrences="32" value="ja" /> + <ngram occurrences="32" value="as" /> + <ngram occurrences="32" value="al" /> + <ngram occurrences="31" value="sa" /> + <ngram occurrences="31" value="r_" /> + <ngram occurrences="31" value="men" /> + <ngram occurrences="31" value="ia" /> + <ngram occurrences="31" value="_se" /> + <ngram occurrences="30" value="si" /> + <ngram occurrences="30" value="s_" /> + <ngram occurrences="30" value="_pe" /> + <ngram occurrences="29" value="ti" /> + <ngram occurrences="29" value="c" /> + <ngram occurrences="29" value="_men" /> + <ngram occurrences="28" value="t_" /> + <ngram occurrences="28" value="it" /> + <ngram occurrences="27" value="ny" /> + <ngram occurrences="27" value="em" /> + <ngram occurrences="27" value="ba" /> + <ngram occurrences="26" value="kan" /> + <ngram occurrences="26" value="di_" /> + <ngram occurrences="26" value="am" /> + <ngram occurrences="25" value="te" /> + <ngram occurrences="25" value="ak_" /> + <ngram occurrences="25" value="_ka" /> + <ngram occurrences="24" value="kan_" /> + <ngram occurrences="24" value="eng" /> + <ngram occurrences="24" value="_da" /> + <ngram occurrences="23" value="nga" /> + <ngram occurrences="23" value="ad" /> + <ngram occurrences="22" value="li" /> + <ngram occurrences="22" value="is" /> + <ngram occurrences="22" value="el" /> + <ngram occurrences="22" value="ber" /> + <ngram occurrences="22" value="ah_" /> + <ngram occurrences="22" value="_be" /> + <ngram occurrences="21" value="ya_" /> + <ngram occurrences="21" value="nt" /> + <ngram occurrences="21" value="ni" /> + <ngram occurrences="21" value="bu" /> + <ngram occurrences="21" value="ata" /> + <ngram occurrences="20" value="a_m" /> + <ngram occurrences="20" value="_j" /> + <ngram occurrences="19" value="us" /> + <ngram occurrences="19" value="su" /> + <ngram occurrences="19" value="ran" /> + <ngram occurrences="19" value="nya" /> + <ngram occurrences="19" value="ik" /> + <ngram occurrences="19" value="ha" /> + <ngram occurrences="19" value="gan" /> + <ngram occurrences="19" value="at_" /> + <ngram occurrences="19" value="ari" /> + <ngram occurrences="19" value="ara" /> + <ngram occurrences="19" value="ap" /> + <ngram occurrences="19" value="_y" /> + <ngram occurrences="18" value="to" /> + <ngram occurrences="18" value="ru" /> + <ngram occurrences="18" value="po" /> + <ngram occurrences="18" value="era" /> + <ngram occurrences="18" value="dan" /> + <ngram occurrences="18" value="_ya" /> + <ngram occurrences="18" value="_te" /> + <ngram occurrences="18" value="_ber" /> + <ngram occurrences="17" value="yang" /> + <ngram occurrences="17" value="yan" /> + <ngram occurrences="17" value="ur" /> + <ngram occurrences="17" value="uk" /> + <ngram occurrences="17" value="ter" /> + <ngram occurrences="17" value="nd" /> + <ngram occurrences="17" value="na_" /> + <ngram occurrences="17" value="es" /> + <ngram occurrences="17" value="_di_" /> + <ngram occurrences="17" value="_c" /> + <ngram occurrences="16" value="yang_" /> + <ngram occurrences="16" value="ung" /> + <ngram occurrences="16" value="ol" /> + <ngram occurrences="16" value="ngan" /> + <ngram occurrences="16" value="l_" /> + <ngram occurrences="16" value="ala" /> + <ngram occurrences="16" value="a_s" /> + <ngram occurrences="16" value="_ta" /> + <ngram occurrences="15" value="per" /> + <ngram occurrences="15" value="nya_" /> + <ngram occurrences="15" value="dan_" /> + <ngram occurrences="15" value="_yang" /> + <ngram occurrences="15" value="_yan" /> + <ngram occurrences="15" value="_ter" /> + <ngram occurrences="15" value="_ba" /> + <ngram occurrences="14" value="tu_" /> + <ngram occurrences="14" value="ta_" /> + <ngram occurrences="14" value="ok" /> + <ngram occurrences="14" value="ni_" /> + <ngram occurrences="14" value="lu" /> + <ngram occurrences="14" value="ko" /> + <ngram occurrences="14" value="ju" /> + <ngram occurrences="14" value="itu" /> + <ngram occurrences="14" value="i_k" /> + <ngram occurrences="14" value="enga" /> + <ngram occurrences="14" value="ek" /> + <ngram occurrences="14" value="du" /> + <ngram occurrences="14" value="de" /> + <ngram occurrences="14" value="_in" /> + <ngram occurrences="14" value="_dan_" /> + <ngram occurrences="14" value="_dan" /> + <ngram occurrences="13" value="ut" /> + <ngram occurrences="13" value="si_" /> + <ngram occurrences="13" value="re" /> + <ngram occurrences="13" value="rang" /> + <ngram occurrences="13" value="pen" /> + <ngram occurrences="13" value="n_d" /> + <ngram occurrences="13" value="m_" /> + <ngram occurrences="13" value="ku" /> + <ngram occurrences="13" value="kar" /> + <ngram occurrences="13" value="ina" /> + <ngram occurrences="13" value="ia_" /> + <ngram occurrences="13" value="ge" /> + <ngram occurrences="13" value="eri" /> + <ngram occurrences="13" value="e_" /> + <ngram occurrences="13" value="da_" /> + <ngram occurrences="13" value="ai" /> + <ngram occurrences="13" value="a_p" /> + <ngram occurrences="13" value="a_i" /> + <ngram occurrences="13" value="_u" /> + <ngram occurrences="13" value="_ma" /> + <ngram occurrences="12" value="w" /> + <ngram occurrences="12" value="ul" /> + <ngram occurrences="12" value="ua" /> + <ngram occurrences="12" value="rin" /> + <ngram occurrences="12" value="ri_" /> + <ngram occurrences="12" value="rang_" /> + <ngram occurrences="12" value="pr" /> + <ngram occurrences="12" value="pol" /> + <ngram occurrences="12" value="or" /> + <ngram occurrences="12" value="ngan_" /> + <ngram occurrences="12" value="n_p" /> + <ngram occurrences="12" value="mp" /> + <ngram occurrences="12" value="itu_" /> + <ngram occurrences="12" value="ini" /> + <ngram occurrences="12" value="gi" /> + <ngram occurrences="12" value="gan_" /> + <ngram occurrences="12" value="et" /> + <ngram occurrences="12" value="ca" /> + <ngram occurrences="12" value="an_d" /> + <ngram occurrences="12" value="a_me" /> + <ngram occurrences="12" value="a_d" /> + <ngram occurrences="12" value="_po" /> + <ngram occurrences="12" value="_pen" /> + <ngram occurrences="11" value="us_" /> + <ngram occurrences="11" value="tan" /> + <ngram occurrences="11" value="ngg" /> + <ngram occurrences="11" value="ng_d" /> + <ngram occurrences="11" value="n_k" /> + <ngram occurrences="11" value="mi" /> + <ngram occurrences="11" value="lan" /> + <ngram occurrences="11" value="ini_" /> + <ngram occurrences="11" value="ina_" /> + <ngram occurrences="11" value="i_m" /> + <ngram occurrences="11" value="i_d" /> + <ngram occurrences="11" value="gg" /> + <ngram occurrences="11" value="g_d" /> + <ngram occurrences="11" value="ena" /> + <ngram occurrences="11" value="ed" /> + <ngram occurrences="11" value="d_" /> + <ngram occurrences="11" value="as_" /> + <ngram occurrences="11" value="ar_" /> + <ngram occurrences="11" value="an_p" /> + <ngram occurrences="11" value="ama" /> + <ngram occurrences="11" value="aka" /> + <ngram occurrences="11" value="ab" /> + <ngram occurrences="11" value="_per" /> + <ngram occurrences="11" value="_l" /> + <ngram occurrences="11" value="_ja" /> + <ngram occurrences="11" value="_ini_" /> + <ngram occurrences="11" value="_ini" /> + <ngram occurrences="10" value="zarin" /> + <ngram occurrences="10" value="zari" /> + <ngram occurrences="10" value="zar" /> + <ngram occurrences="10" value="za" /> + <ngram occurrences="10" value="z" /> + <ngram occurrences="10" value="wa" /> + <ngram occurrences="10" value="uk_" /> + <ngram occurrences="10" value="uh" /> + <ngram occurrences="10" value="rt" /> + <ngram occurrences="10" value="rina_" /> + <ngram occurrences="10" value="rina" /> + <ngram occurrences="10" value="ngk" /> + <ngram occurrences="10" value="n_b" /> + <ngram occurrences="10" value="mu" /> + <ngram occurrences="10" value="mem" /> + <ngram occurrences="10" value="ki" /> + <ngram occurrences="10" value="im" /> + <ngram occurrences="10" value="ika" /> + <ngram occurrences="10" value="i_b" /> + <ngram occurrences="10" value="gk" /> + <ngram occurrences="10" value="f" /> + <ngram occurrences="10" value="eru" /> + <ngram occurrences="10" value="ela" /> + <ngram occurrences="10" value="arina" /> + <ngram occurrences="10" value="arin" /> + <ngram occurrences="10" value="ang_d" /> + <ngram occurrences="10" value="an_b" /> + <ngram occurrences="10" value="al_" /> + <ngram occurrences="10" value="ag" /> + <ngram occurrences="10" value="adi" /> + <ngram occurrences="10" value="_zari" /> + <ngram occurrences="10" value="_zar" /> + <ngram occurrences="10" value="_za" /> + <ngram occurrences="10" value="_z" /> + <ngram occurrences="10" value="_pol" /> + <ngram occurrences="10" value="_n" /> + <ngram occurrences="10" value="_mem" /> + <ngram occurrences="10" value="_g" /> + <ngram occurrences="9" value="sm" /> + <ngram occurrences="9" value="pu" /> + <ngram occurrences="9" value="os" /> + <ngram occurrences="9" value="oh_" /> + <ngram occurrences="9" value="oh" /> + <ngram occurrences="9" value="o_" /> + <ngram occurrences="9" value="ntu" /> + <ngram occurrences="9" value="ng_di" /> + <ngram occurrences="9" value="n_t" /> + <ngram occurrences="9" value="man" /> + <ngram occurrences="9" value="ma_" /> + <ngram occurrences="9" value="jadi" /> + <ngram occurrences="9" value="jad" /> + <ngram occurrences="9" value="ing" /> + <ngram occurrences="9" value="il" /> + <ngram occurrences="9" value="i_s" /> + <ngram occurrences="9" value="ga_" /> + <ngram occurrences="9" value="g_di" /> + <ngram occurrences="9" value="engan" /> + <ngram occurrences="9" value="eb" /> + <ngram occurrences="9" value="dia" /> + <ngram occurrences="9" value="asi" /> + <ngram occurrences="9" value="apa" /> + <ngram occurrences="9" value="an_t" /> + <ngram occurrences="9" value="a_t" /> + <ngram occurrences="9" value="a_k" /> + <ngram occurrences="9" value="_sa" /> + <ngram occurrences="9" value="_pa" /> + <ngram occurrences="9" value="_itu_" /> + <ngram occurrences="9" value="_itu" /> + <ngram occurrences="9" value="_it" /> + <ngram occurrences="9" value="_de" /> + <ngram occurrences="8" value="uh_" /> + <ngram occurrences="8" value="u_m" /> + <ngram occurrences="8" value="tak" /> + <ngram occurrences="8" value="st" /> + <ngram occurrences="8" value="rk" /> + <ngram occurrences="8" value="rd" /> + <ngram occurrences="8" value="ra_" /> + <ngram occurrences="8" value="pi" /> + <ngram occurrences="8" value="pat" /> + <ngram occurrences="8" value="p_" /> + <ngram occurrences="8" value="oko" /> + <ngram occurrences="8" value="nu" /> + <ngram occurrences="8" value="nj" /> + <ngram occurrences="8" value="n_s" /> + <ngram occurrences="8" value="n_pe" /> + <ngram occurrences="8" value="n_m" /> + <ngram occurrences="8" value="meng" /> + <ngram occurrences="8" value="mb" /> + <ngram occurrences="8" value="le" /> + <ngram occurrences="8" value="kal" /> + <ngram occurrences="8" value="isi" /> + <ngram occurrences="8" value="ip" /> + <ngram occurrences="8" value="ian" /> + <ngram occurrences="8" value="ep" /> + <ngram occurrences="8" value="eny" /> + <ngram occurrences="8" value="emb" /> + <ngram occurrences="8" value="aya" /> + <ngram occurrences="8" value="ay" /> + <ngram occurrences="8" value="au" /> + <ngram occurrences="8" value="ant" /> + <ngram occurrences="8" value="an_k" /> + <ngram occurrences="8" value="aga" /> + <ngram occurrences="8" value="ada" /> + <ngram occurrences="8" value="a_se" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_r" /> + <ngram occurrences="8" value="_meng" /> + <ngram occurrences="8" value="_h" /> + <ngram occurrences="8" value="_ad" /> + <ngram occurrences="7" value="ung_" /> + <ngram occurrences="7" value="um" /> + <ngram occurrences="7" value="uga" /> + <ngram occurrences="7" value="ug" /> + <ngram occurrences="7" value="tuk_" /> + <ngram occurrences="7" value="tuk" /> + <ngram occurrences="7" value="toko" /> + <ngram occurrences="7" value="tok" /> + <ngram occurrences="7" value="tak_" /> + <ngram occurrences="7" value="sia" /> + <ngram occurrences="7" value="ser" /> + <ngram occurrences="7" value="san" /> + <ngram occurrences="7" value="ro" /> + <ngram occurrences="7" value="rl" /> + <ngram occurrences="7" value="rah" /> + <ngram occurrences="7" value="r_d" /> + <ngram occurrences="7" value="peng" /> + <ngram occurrences="7" value="pat_" /> + <ngram occurrences="7" value="pan" /> + <ngram occurrences="7" value="ot" /> + <ngram occurrences="7" value="or_" /> + <ngram occurrences="7" value="ntuk_" /> + <ngram occurrences="7" value="ntuk" /> + <ngram occurrences="7" value="ngka" /> + <ngram occurrences="7" value="ngga" /> + <ngram occurrences="7" value="ng_m" /> + <ngram occurrences="7" value="ng_k" /> + <ngram occurrences="7" value="nda" /> + <ngram occurrences="7" value="n_me" /> + <ngram occurrences="7" value="meny" /> + <ngram occurrences="7" value="lu_" /> + <ngram occurrences="7" value="lam" /> + <ngram occurrences="7" value="k_d" /> + <ngram occurrences="7" value="jak" /> + <ngram occurrences="7" value="jadi_" /> + <ngram occurrences="7" value="ita" /> + <ngram occurrences="7" value="ih" /> + <ngram occurrences="7" value="ib" /> + <ngram occurrences="7" value="i_p" /> + <ngram occurrences="7" value="i_me" /> + <ngram occurrences="7" value="i_a" /> + <ngram occurrences="7" value="gka" /> + <ngram occurrences="7" value="gga" /> + <ngram occurrences="7" value="ger" /> + <ngram occurrences="7" value="g_m" /> + <ngram occurrences="7" value="g_k" /> +</ngrams> diff --git a/src/plugins/language/irish.klp b/src/plugins/language/irish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="823" value="_" /> + <ngram occurrences="557" value="a" /> + <ngram occurrences="310" value="i" /> + <ngram occurrences="273" value="h" /> + <ngram occurrences="247" value="n" /> + <ngram occurrences="199" value="_a" /> + <ngram occurrences="190" value="r" /> + <ngram occurrences="187" value="s" /> + <ngram occurrences="171" value="t" /> + <ngram occurrences="170" value="e" /> + <ngram occurrences="145" value="c" /> + <ngram occurrences="142" value="l" /> + <ngram occurrences="121" value="g" /> + <ngram occurrences="121" value="a_" /> + <ngram occurrences="117" value="o" /> + <ngram occurrences="117" value="n_" /> + <ngram occurrences="113" value="d" /> + <ngram occurrences="100" value="m" /> + <ngram occurrences="87" value="b" /> + <ngram occurrences="87" value="an" /> + <ngram occurrences="86" value="u" /> + <ngram occurrences="83" value="h_" /> + <ngram occurrences="81" value="í" /> + <ngram occurrences="79" value="é" /> + <ngram occurrences="79" value="_s" /> + <ngram occurrences="78" value="ai" /> + <ngram occurrences="77" value="ch" /> + <ngram occurrences="75" value="ea" /> + <ngram occurrences="73" value="á" /> + <ngram occurrences="71" value="r_" /> + <ngram occurrences="65" value="_b" /> + <ngram occurrences="60" value="s_" /> + <ngram occurrences="59" value="ar" /> + <ngram occurrences="58" value="f" /> + <ngram occurrences="58" value="_t" /> + <ngram occurrences="57" value="_c" /> + <ngram occurrences="56" value="in" /> + <ngram occurrences="54" value="an_" /> + <ngram occurrences="52" value="_m" /> + <ngram occurrences="51" value="í_" /> + <ngram occurrences="51" value="_d" /> + <ngram occurrences="50" value="bh" /> + <ngram occurrences="49" value="ac" /> + <ngram occurrences="48" value="ag" /> + <ngram occurrences="48" value="_a_" /> + <ngram occurrences="45" value="th" /> + <ngram occurrences="45" value="_an" /> + <ngram occurrences="44" value="ir" /> + <ngram occurrences="44" value="ha" /> + <ngram occurrences="41" value="ach" /> + <ngram occurrences="39" value="_l" /> + <ngram occurrences="38" value="é_" /> + <ngram occurrences="38" value="_f" /> + <ngram occurrences="38" value="_bh" /> + <ngram occurrences="38" value="_an_" /> + <ngram occurrences="38" value="_ag" /> + <ngram occurrences="37" value="l_" /> + <ngram occurrences="37" value="e_" /> + <ngram occurrences="35" value="g_" /> + <ngram occurrences="34" value="le" /> + <ngram occurrences="34" value="_i" /> + <ngram occurrences="33" value="p" /> + <ngram occurrences="33" value="is" /> + <ngram occurrences="33" value="il" /> + <ngram occurrences="32" value="na" /> + <ngram occurrences="32" value="id" /> + <ngram occurrences="32" value="ar_" /> + <ngram occurrences="31" value="ó" /> + <ngram occurrences="30" value="mh" /> + <ngram occurrences="30" value="_n" /> + <ngram occurrences="29" value="_g" /> + <ngram occurrences="28" value="t_" /> + <ngram occurrences="28" value="r_a" /> + <ngram occurrences="28" value="nn" /> + <ngram occurrences="28" value="_ch" /> + <ngram occurrences="27" value="ch_" /> + <ngram occurrences="26" value="á_" /> + <ngram occurrences="26" value="o_" /> + <ngram occurrences="26" value="it" /> + <ngram occurrences="26" value="ir_" /> + <ngram occurrences="26" value="dh" /> + <ngram occurrences="26" value="ach_" /> + <ngram occurrences="25" value="sé" /> + <ngram occurrences="25" value="d_" /> + <ngram occurrences="25" value="_sé" /> + <ngram occurrences="25" value="_ar" /> + <ngram occurrences="24" value="ú" /> + <ngram occurrences="24" value="ái" /> + <ngram occurrences="24" value="sé_" /> + <ngram occurrences="24" value="h_a" /> + <ngram occurrences="24" value="ei" /> + <ngram occurrences="24" value="am" /> + <ngram occurrences="24" value="_sé_" /> + <ngram occurrences="24" value="_le" /> + <ngram occurrences="23" value="ra" /> + <ngram occurrences="23" value="he" /> + <ngram occurrences="23" value="al" /> + <ngram occurrences="22" value="ui" /> + <ngram occurrences="22" value="ta" /> + <ngram occurrences="22" value="ean" /> + <ngram occurrences="21" value="éa" /> + <ngram occurrences="21" value="us" /> + <ngram occurrences="21" value="ig" /> + <ngram occurrences="21" value="gu" /> + <ngram occurrences="21" value="_p" /> + <ngram occurrences="20" value="te" /> + <ngram occurrences="20" value="se" /> + <ngram occurrences="20" value="n_a" /> + <ngram occurrences="20" value="as" /> + <ngram occurrences="20" value="a_a" /> + <ngram occurrences="19" value="oi" /> + <ngram occurrences="19" value="nn_" /> + <ngram occurrences="19" value="hu" /> + <ngram occurrences="19" value="hai" /> + <ngram occurrences="19" value="de" /> + <ngram occurrences="19" value="ag_" /> + <ngram occurrences="18" value="éi" /> + <ngram occurrences="18" value="us_" /> + <ngram occurrences="18" value="st" /> + <ngram occurrences="18" value="sa" /> + <ngram occurrences="18" value="ith" /> + <ngram occurrences="18" value="in_" /> + <ngram occurrences="18" value="gus_" /> + <ngram occurrences="18" value="gus" /> + <ngram occurrences="18" value="ga" /> + <ngram occurrences="18" value="agus_" /> + <ngram occurrences="18" value="agus" /> + <ngram occurrences="18" value="agu" /> + <ngram occurrences="18" value="a_d" /> + <ngram occurrences="18" value="a_b" /> + <ngram occurrences="18" value="_ar_" /> + <ngram occurrences="18" value="_agus" /> + <ngram occurrences="18" value="_agu" /> + <ngram occurrences="17" value="ua" /> + <ngram occurrences="17" value="is_" /> + <ngram occurrences="16" value="tha" /> + <ngram occurrences="16" value="s_a" /> + <ngram occurrences="16" value="rt" /> + <ngram occurrences="16" value="i_" /> + <ngram occurrences="16" value="há" /> + <ngram occurrences="16" value="go" /> + <ngram occurrences="16" value="dh_" /> + <ngram occurrences="16" value="_ac" /> + <ngram occurrences="15" value="ío" /> + <ngram occurrences="15" value="tá_" /> + <ngram occurrences="15" value="tá" /> + <ngram occurrences="15" value="ní" /> + <ngram occurrences="15" value="na_" /> + <ngram occurrences="15" value="ma" /> + <ngram occurrences="15" value="m_" /> + <ngram occurrences="15" value="il_" /> + <ngram occurrences="15" value="ia" /> + <ngram occurrences="15" value="hí" /> + <ngram occurrences="15" value="go_" /> + <ngram occurrences="15" value="gh" /> + <ngram occurrences="15" value="bhí" /> + <ngram occurrences="15" value="at" /> + <ngram occurrences="15" value="ann" /> + <ngram occurrences="15" value="ad" /> + <ngram occurrences="15" value="a_bh" /> + <ngram occurrences="15" value="_ní" /> + <ngram occurrences="15" value="_go" /> + <ngram occurrences="15" value="_bhí" /> + <ngram occurrences="14" value="í_a" /> + <ngram occurrences="14" value="re" /> + <ngram occurrences="14" value="n_t" /> + <ngram occurrences="14" value="le_" /> + <ngram occurrences="14" value="la" /> + <ngram occurrences="14" value="igh" /> + <ngram occurrences="14" value="hí_" /> + <ngram occurrences="14" value="fa" /> + <ngram occurrences="14" value="ear" /> + <ngram occurrences="14" value="each" /> + <ngram occurrences="14" value="eac" /> + <ngram occurrences="14" value="bhí_" /> + <ngram occurrences="14" value="amh" /> + <ngram occurrences="14" value="ait" /> + <ngram occurrences="14" value="_é" /> + <ngram occurrences="14" value="_go_" /> + <ngram occurrences="14" value="_bhí_" /> + <ngram occurrences="14" value="_ag_" /> + <ngram occurrences="13" value="ti" /> + <ngram occurrences="13" value="rí" /> + <ngram occurrences="13" value="mh_" /> + <ngram occurrences="13" value="hea" /> + <ngram occurrences="13" value="fh" /> + <ngram occurrences="13" value="eo" /> + <ngram occurrences="13" value="c_" /> + <ngram occurrences="13" value="ann_" /> + <ngram occurrences="13" value="_fh" /> + <ngram occurrences="13" value="_a_d" /> + <ngram occurrences="13" value="_a_bh" /> + <ngram occurrences="13" value="_a_b" /> + <ngram occurrences="12" value="th_" /> + <ngram occurrences="12" value="ng" /> + <ngram occurrences="12" value="inn" /> + <ngram occurrences="12" value="hái" /> + <ngram occurrences="12" value="ho" /> + <ngram occurrences="12" value="hi" /> + <ngram occurrences="12" value="h_t" /> + <ngram occurrences="12" value="h_s" /> + <ngram occurrences="12" value="as_" /> + <ngram occurrences="12" value="air" /> + <ngram occurrences="12" value="_ó" /> + <ngram occurrences="12" value="_tá_" /> + <ngram occurrences="12" value="_tá" /> + <ngram occurrences="12" value="_se" /> + <ngram occurrences="12" value="_de" /> + <ngram occurrences="11" value="án" /> + <ngram occurrences="11" value="sc" /> + <ngram occurrences="11" value="rai" /> + <ngram occurrences="11" value="r_an" /> + <ngram occurrences="11" value="or" /> + <ngram occurrences="11" value="n_n" /> + <ngram occurrences="11" value="ith_" /> + <ngram occurrences="11" value="ir_a" /> + <ngram occurrences="11" value="ha_" /> + <ngram occurrences="11" value="cha" /> + <ngram occurrences="11" value="ar_a" /> + <ngram occurrences="11" value="aith" /> + <ngram occurrences="11" value="aig" /> + <ngram occurrences="11" value="aid" /> + <ngram occurrences="11" value="_r" /> + <ngram occurrences="11" value="_in" /> + <ngram occurrences="11" value="_ach_" /> + <ngram occurrences="11" value="_ach" /> + <ngram occurrences="10" value="é_a" /> + <ngram occurrences="10" value="ta_" /> + <ngram occurrences="10" value="t_a" /> + <ngram occurrences="10" value="sa_" /> + <ngram occurrences="10" value="r_an_" /> + <ngram occurrences="10" value="om" /> + <ngram occurrences="10" value="l_a" /> + <ngram occurrences="10" value="igh_" /> + <ngram occurrences="10" value="hé" /> + <ngram occurrences="10" value="hf" /> + <ngram occurrences="10" value="gh_" /> + <ngram occurrences="10" value="d_a" /> + <ngram occurrences="10" value="ca" /> + <ngram occurrences="10" value="be" /> + <ngram occurrences="10" value="art" /> + <ngram occurrences="10" value="amh_" /> + <ngram occurrences="10" value="al_" /> + <ngram occurrences="10" value="air_" /> + <ngram occurrences="10" value="ain" /> + <ngram occurrences="10" value="aigh" /> + <ngram occurrences="10" value="acha" /> + <ngram occurrences="10" value="a_c" /> + <ngram occurrences="10" value="_ta" /> + <ngram occurrences="10" value="_ma" /> + <ngram occurrences="10" value="_dh" /> + <ngram occurrences="9" value="án_" /> + <ngram occurrences="9" value="uil" /> + <ngram occurrences="9" value="tea" /> + <ngram occurrences="9" value="sea" /> + <ngram occurrences="9" value="rea" /> + <ngram occurrences="9" value="r_s" /> + <ngram occurrences="9" value="nt" /> + <ngram occurrences="9" value="ne" /> + <ngram occurrences="9" value="n_s" /> + <ngram occurrences="9" value="n_f" /> + <ngram occurrences="9" value="lá" /> + <ngram occurrences="9" value="li" /> + <ngram occurrences="9" value="io" /> + <ngram occurrences="9" value="im" /> + <ngram occurrences="9" value="ile" /> + <ngram occurrences="9" value="idh_" /> + <ngram occurrences="9" value="idh" /> + <ngram occurrences="9" value="id_" /> + <ngram occurrences="9" value="ht" /> + <ngram occurrences="9" value="har" /> + <ngram occurrences="9" value="ean_" /> + <ngram occurrences="9" value="eag" /> + <ngram occurrences="9" value="cu" /> + <ngram occurrences="9" value="chu" /> + <ngram occurrences="9" value="bhf" /> + <ngram occurrences="9" value="bea" /> + <ngram occurrences="9" value="aga" /> + <ngram occurrences="9" value="_o" /> + <ngram occurrences="9" value="_mh" /> + <ngram occurrences="9" value="_is" /> + <ngram occurrences="9" value="_chu" /> + <ngram occurrences="9" value="_bhf" /> + <ngram occurrences="8" value="úi" /> + <ngram occurrences="8" value="ós" /> + <ngram occurrences="8" value="í_s" /> + <ngram occurrences="8" value="éan" /> + <ngram occurrences="8" value="sí" /> + <ngram occurrences="8" value="si" /> + <ngram occurrences="8" value="s_d" /> + <ngram occurrences="8" value="ri" /> + <ngram occurrences="8" value="ra_" /> + <ngram occurrences="8" value="r_a_" /> + <ngram occurrences="8" value="on" /> + <ngram occurrences="8" value="oc" /> + <ngram occurrences="8" value="nn_a" /> + <ngram occurrences="8" value="n_b" /> + <ngram occurrences="8" value="mé_" /> + <ngram occurrences="8" value="mé" /> + <ngram occurrences="8" value="mu" /> + <ngram occurrences="8" value="mha" /> + <ngram occurrences="8" value="ll" /> + <ngram occurrences="8" value="ist" /> + <ngram occurrences="8" value="ile_" /> + <ngram occurrences="8" value="ic" /> + <ngram occurrences="8" value="hr" /> + <ngram occurrences="8" value="hean" /> + <ngram occurrences="8" value="h_m" /> + <ngram occurrences="8" value="di" /> + <ngram occurrences="8" value="bhe" /> + <ngram occurrences="8" value="an_t" /> + <ngram occurrences="8" value="ail" /> + <ngram occurrences="8" value="a_f" /> + <ngram occurrences="8" value="a_de" /> + <ngram occurrences="8" value="_ti" /> + <ngram occurrences="8" value="_th" /> + <ngram occurrences="8" value="_sí" /> + <ngram occurrences="8" value="_na" /> + <ngram occurrences="8" value="_mé_" /> + <ngram occurrences="8" value="_mé" /> + <ngram occurrences="8" value="_fa" /> + <ngram occurrences="8" value="_bea" /> + <ngram occurrences="8" value="_be" /> + <ngram occurrences="8" value="_ar_a" /> + <ngram occurrences="7" value="ú_" /> + <ngram occurrences="7" value="é_c" /> + <ngram occurrences="7" value="áid" /> + <ngram occurrences="7" value="y" /> + <ngram occurrences="7" value="te_" /> + <ngram occurrences="7" value="sí_" /> + <ngram occurrences="7" value="ste" /> + <ngram occurrences="7" value="seo" /> + <ngram occurrences="7" value="sean" /> + <ngram occurrences="7" value="s_an_" /> + <ngram occurrences="7" value="s_an" /> + <ngram occurrences="7" value="rt_" /> + <ngram occurrences="7" value="pa" /> + <ngram occurrences="7" value="ol" /> + <ngram occurrences="7" value="ní_" /> + <ngram occurrences="7" value="n_ní" /> + <ngram occurrences="7" value="lt" /> + <ngram occurrences="7" value="lei" /> + <ngram occurrences="7" value="iste" /> + <ngram occurrences="7" value="ing" /> + <ngram occurrences="7" value="hó" /> + <ngram occurrences="7" value="hui" /> + <ngram occurrences="7" value="hua" /> + <ngram occurrences="7" value="ha_a" /> + <ngram occurrences="7" value="fai" /> + <ngram occurrences="7" value="en" /> + <ngram occurrences="7" value="eir_" /> + <ngram occurrences="7" value="eir" /> + <ngram occurrences="7" value="eann" /> + <ngram occurrences="7" value="eacha" /> + <ngram occurrences="7" value="deir_" /> + <ngram occurrences="7" value="deir" /> + <ngram occurrences="7" value="dei" /> + <ngram occurrences="7" value="dea" /> + <ngram occurrences="7" value="cht" /> + <ngram occurrences="7" value="ba" /> + <ngram occurrences="7" value="as_a" /> + <ngram occurrences="7" value="ana" /> + <ngram occurrences="7" value="aith_" /> + <ngram occurrences="7" value="air_a" /> + <ngram occurrences="7" value="aigh_" /> + <ngram occurrences="7" value="adh_" /> + <ngram occurrences="7" value="adh" /> + <ngram occurrences="7" value="a_s" /> + <ngram occurrences="7" value="a_m" /> + <ngram occurrences="7" value="a_g" /> + <ngram occurrences="7" value="a_dei" /> + <ngram occurrences="7" value="a_ch" /> + <ngram occurrences="7" value="_éi" /> + <ngram occurrences="7" value="_sí_" /> + <ngram occurrences="7" value="_si" /> + <ngram occurrences="7" value="_sc" /> + <ngram occurrences="7" value="_sa" /> + <ngram occurrences="7" value="_ní_" /> + <ngram occurrences="7" value="_mu" /> + <ngram occurrences="7" value="_lei" /> + <ngram occurrences="7" value="_deir" /> + <ngram occurrences="7" value="_dei" /> + <ngram occurrences="7" value="_bhe" /> + <ngram occurrences="7" value="_at" /> + <ngram occurrences="7" value="_an_t" /> + <ngram occurrences="7" value="_am" /> + <ngram occurrences="7" value="_ai" /> + <ngram occurrences="7" value="_a_de" /> + <ngram occurrences="6" value="óst" /> + <ngram occurrences="6" value="éal" /> + <ngram occurrences="6" value="é_s" /> + <ngram occurrences="6" value="áil" /> + <ngram occurrences="6" value="uí_a" /> + <ngram occurrences="6" value="uí_" /> + <ngram occurrences="6" value="uí" /> + <ngram occurrences="6" value="uil_" /> + <ngram occurrences="6" value="uid_" /> + <ngram occurrences="6" value="uid" /> + <ngram occurrences="6" value="uai" /> + <ngram occurrences="6" value="tú" /> +</ngrams> diff --git a/src/plugins/language/italian.klp b/src/plugins/language/italian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="899" value="_" /> + <ngram occurrences="549" value="a" /> + <ngram occurrences="412" value="e" /> + <ngram occurrences="393" value="i" /> + <ngram occurrences="344" value="o" /> + <ngram occurrences="286" value="l" /> + <ngram occurrences="248" value="n" /> + <ngram occurrences="246" value="r" /> + <ngram occurrences="240" value="a_" /> + <ngram occurrences="210" value="s" /> + <ngram occurrences="206" value="c" /> + <ngram occurrences="185" value="e_" /> + <ngram occurrences="184" value="t" /> + <ngram occurrences="172" value="d" /> + <ngram occurrences="151" value="o_" /> + <ngram occurrences="131" value="i_" /> + <ngram occurrences="124" value="u" /> + <ngram occurrences="121" value="v" /> + <ngram occurrences="105" value="p" /> + <ngram occurrences="105" value="m" /> + <ngram occurrences="97" value="_c" /> + <ngram occurrences="96" value="_s" /> + <ngram occurrences="93" value="_d" /> + <ngram occurrences="84" value="_a" /> + <ngram occurrences="67" value="l_" /> + <ngram occurrences="65" value="la" /> + <ngram occurrences="62" value="_p" /> + <ngram occurrences="61" value="g" /> + <ngram occurrences="59" value="er" /> + <ngram occurrences="59" value="ar" /> + <ngram occurrences="57" value="an" /> + <ngram occurrences="56" value="h" /> + <ngram occurrences="55" value="_l" /> + <ngram occurrences="53" value="co" /> + <ngram occurrences="52" value="ri" /> + <ngram occurrences="52" value="_m" /> + <ngram occurrences="51" value="re" /> + <ngram occurrences="51" value="ll" /> + <ngram occurrences="51" value="la_" /> + <ngram occurrences="51" value="_i" /> + <ngram occurrences="47" value="no" /> + <ngram occurrences="46" value="ra" /> + <ngram occurrences="46" value="di" /> + <ngram occurrences="46" value="ch" /> + <ngram occurrences="45" value="el" /> + <ngram occurrences="45" value="_e" /> + <ngram occurrences="44" value="to" /> + <ngram occurrences="43" value="va" /> + <ngram occurrences="43" value="se" /> + <ngram occurrences="43" value="n_" /> + <ngram occurrences="43" value="b" /> + <ngram occurrences="42" value="ia" /> + <ngram occurrences="42" value="_v" /> + <ngram occurrences="42" value="_di" /> + <ngram occurrences="41" value="f" /> + <ngram occurrences="41" value="_n" /> + <ngram occurrences="40" value="in" /> + <ngram occurrences="38" value="av" /> + <ngram occurrences="38" value="al" /> + <ngram occurrences="38" value="_co" /> + <ngram occurrences="37" value="do" /> + <ngram occurrences="36" value="to_" /> + <ngram occurrences="36" value="on" /> + <ngram occurrences="35" value="re_" /> + <ngram occurrences="35" value="or" /> + <ngram occurrences="35" value="na" /> + <ngram occurrences="34" value="ta" /> + <ngram occurrences="34" value="li" /> + <ngram occurrences="34" value="en" /> + <ngram occurrences="34" value="ca" /> + <ngram occurrences="33" value="pe" /> + <ngram occurrences="32" value="si" /> + <ngram occurrences="32" value="da" /> + <ngram occurrences="31" value="ve" /> + <ngram occurrences="31" value="va_" /> + <ngram occurrences="31" value="ma" /> + <ngram occurrences="30" value="sa" /> + <ngram occurrences="30" value="ol" /> + <ngram occurrences="30" value="lla" /> + <ngram occurrences="30" value="le" /> + <ngram occurrences="30" value="de" /> + <ngram occurrences="30" value="as" /> + <ngram occurrences="29" value="cc" /> + <ngram occurrences="28" value="lla_" /> + <ngram occurrences="28" value="io" /> + <ngram occurrences="28" value="_f" /> + <ngram occurrences="27" value="il" /> + <ngram occurrences="27" value="a_c" /> + <ngram occurrences="27" value="_u" /> + <ngram occurrences="27" value="_e_" /> + <ngram occurrences="26" value="tt" /> + <ngram occurrences="26" value="o_d" /> + <ngram occurrences="26" value="no_" /> + <ngram occurrences="26" value="ne" /> + <ngram occurrences="26" value="nd" /> + <ngram occurrences="26" value="ia_" /> + <ngram occurrences="26" value="_pe" /> + <ngram occurrences="25" value="st" /> + <ngram occurrences="25" value="nt" /> + <ngram occurrences="25" value="il_" /> + <ngram occurrences="25" value="gli" /> + <ngram occurrences="25" value="gl" /> + <ngram occurrences="25" value="_il_" /> + <ngram occurrences="25" value="_il" /> + <ngram occurrences="25" value="_ch" /> + <ngram occurrences="24" value="ra_" /> + <ngram occurrences="24" value="na_" /> + <ngram occurrences="24" value="ell" /> + <ngram occurrences="24" value="_se" /> + <ngram occurrences="24" value="_de" /> + <ngram occurrences="23" value="ti" /> + <ngram occurrences="23" value="se_" /> + <ngram occurrences="23" value="qu" /> + <ngram occurrences="23" value="q" /> + <ngram occurrences="23" value="om" /> + <ngram occurrences="23" value="me" /> + <ngram occurrences="23" value="le_" /> + <ngram occurrences="23" value="io_" /> + <ngram occurrences="23" value="he_" /> + <ngram occurrences="23" value="he" /> + <ngram occurrences="23" value="che_" /> + <ngram occurrences="23" value="che" /> + <ngram occurrences="23" value="at" /> + <ngram occurrences="23" value="_qu" /> + <ngram occurrences="23" value="_q" /> + <ngram occurrences="23" value="_ca" /> + <ngram occurrences="23" value="_b" /> + <ngram occurrences="22" value="vi" /> + <ngram occurrences="22" value="un" /> + <ngram occurrences="22" value="lo" /> + <ngram occurrences="22" value="e_s" /> + <ngram occurrences="22" value="e_d" /> + <ngram occurrences="22" value="di_" /> + <ngram occurrences="22" value="ci" /> + <ngram occurrences="22" value="a_m" /> + <ngram occurrences="22" value="_un" /> + <ngram occurrences="22" value="_ma" /> + <ngram occurrences="22" value="_di_" /> + <ngram occurrences="22" value="_che_" /> + <ngram occurrences="22" value="_che" /> + <ngram occurrences="21" value="te" /> + <ngram occurrences="21" value="si_" /> + <ngram occurrences="21" value="pa" /> + <ngram occurrences="21" value="a_d" /> + <ngram occurrences="21" value="_la" /> + <ngram occurrences="20" value="z" /> + <ngram occurrences="20" value="vo" /> + <ngram occurrences="20" value="i_s" /> + <ngram occurrences="20" value="del" /> + <ngram occurrences="20" value="ava" /> + <ngram occurrences="20" value="a_i" /> + <ngram occurrences="20" value="_g" /> + <ngram occurrences="20" value="_del" /> + <ngram occurrences="19" value="ss" /> + <ngram occurrences="19" value="r_" /> + <ngram occurrences="19" value="per" /> + <ngram occurrences="19" value="a_s" /> + <ngram occurrences="19" value="_t" /> + <ngram occurrences="19" value="_si" /> + <ngram occurrences="19" value="_per" /> + <ngram occurrences="18" value="is" /> + <ngram occurrences="18" value="ev" /> + <ngram occurrences="18" value="et" /> + <ngram occurrences="18" value="es" /> + <ngram occurrences="18" value="e_c" /> + <ngram occurrences="18" value="and" /> + <ngram occurrences="18" value="_r" /> + <ngram occurrences="18" value="_no" /> + <ngram occurrences="17" value="po" /> + <ngram occurrences="17" value="hi" /> + <ngram occurrences="17" value="era" /> + <ngram occurrences="17" value="e_l" /> + <ngram occurrences="17" value="e_a" /> + <ngram occurrences="17" value="a_a" /> + <ngram occurrences="17" value="_la_" /> + <ngram occurrences="17" value="_in" /> + <ngram occurrences="16" value="ua" /> + <ngram occurrences="16" value="sc" /> + <ngram occurrences="16" value="os" /> + <ngram occurrences="16" value="o_c" /> + <ngram occurrences="16" value="ne_" /> + <ngram occurrences="16" value="li_" /> + <ngram occurrences="16" value="ie" /> + <ngram occurrences="16" value="el_" /> + <ngram occurrences="16" value="chi" /> + <ngram occurrences="16" value="_vi" /> + <ngram occurrences="16" value="_al" /> + <ngram occurrences="16" value="_a_" /> + <ngram occurrences="15" value="tto" /> + <ngram occurrences="15" value="tr" /> + <ngram occurrences="15" value="su" /> + <ngram occurrences="15" value="sa_" /> + <ngram occurrences="15" value="ro" /> + <ngram occurrences="15" value="o_s" /> + <ngram occurrences="15" value="o_a" /> + <ngram occurrences="15" value="mo" /> + <ngram occurrences="15" value="lo_" /> + <ngram occurrences="15" value="it" /> + <ngram occurrences="15" value="ic" /> + <ngram occurrences="15" value="eva" /> + <ngram occurrences="15" value="e_p" /> + <ngram occurrences="15" value="com" /> + <ngram occurrences="15" value="ava_" /> + <ngram occurrences="15" value="are" /> + <ngram occurrences="15" value="all" /> + <ngram occurrences="15" value="a_n" /> + <ngram occurrences="15" value="_su" /> + <ngram occurrences="15" value="_com" /> + <ngram occurrences="14" value="ta_" /> + <ngram occurrences="14" value="per_" /> + <ngram occurrences="14" value="on_" /> + <ngram occurrences="14" value="ndo" /> + <ngram occurrences="14" value="in_" /> + <ngram occurrences="14" value="gli_" /> + <ngram occurrences="14" value="fa" /> + <ngram occurrences="14" value="era_" /> + <ngram occurrences="14" value="er_" /> + <ngram occurrences="14" value="are_" /> + <ngram occurrences="14" value="ano_" /> + <ngram occurrences="14" value="ano" /> + <ngram occurrences="14" value="ad" /> + <ngram occurrences="14" value="ac" /> + <ngram occurrences="14" value="a_l" /> + <ngram occurrences="14" value="_per_" /> + <ngram occurrences="14" value="_in_" /> + <ngram occurrences="13" value="ur" /> + <ngram occurrences="13" value="un_" /> + <ngram occurrences="13" value="tu" /> + <ngram occurrences="13" value="tto_" /> + <ngram occurrences="13" value="te_" /> + <ngram occurrences="13" value="so" /> + <ngram occurrences="13" value="qua" /> + <ngram occurrences="13" value="oc" /> + <ngram occurrences="13" value="non" /> + <ngram occurrences="13" value="mp" /> + <ngram occurrences="13" value="mi" /> + <ngram occurrences="13" value="la_m" /> + <ngram occurrences="13" value="i_c" /> + <ngram occurrences="13" value="ella_" /> + <ngram occurrences="13" value="ella" /> + <ngram occurrences="13" value="do_" /> + <ngram occurrences="13" value="ari" /> + <ngram occurrences="13" value="a_p" /> + <ngram occurrences="13" value="_un_" /> + <ngram occurrences="13" value="_si_" /> + <ngram occurrences="13" value="_qua" /> + <ngram occurrences="13" value="_non" /> + <ngram occurrences="13" value="_do" /> + <ngram occurrences="13" value="_av" /> + <ngram occurrences="12" value="é_" /> + <ngram occurrences="12" value="é" /> + <ngram occurrences="12" value="ut" /> + <ngram occurrences="12" value="uo" /> + <ngram occurrences="12" value="ue" /> + <ngram occurrences="12" value="ti_" /> + <ngram occurrences="12" value="sse" /> + <ngram occurrences="12" value="pr" /> + <ngram occurrences="12" value="non_" /> + <ngram occurrences="12" value="ni" /> + <ngram occurrences="12" value="me_" /> + <ngram occurrences="12" value="l_a" /> + <ngram occurrences="12" value="id" /> + <ngram occurrences="12" value="i_d" /> + <ngram occurrences="12" value="i_a" /> + <ngram occurrences="12" value="eva_" /> + <ngram occurrences="12" value="da_" /> + <ngram occurrences="12" value="col" /> + <ngram occurrences="12" value="ce" /> + <ngram occurrences="12" value="be" /> + <ngram occurrences="12" value="a_e" /> + <ngram occurrences="12" value="_ve" /> + <ngram occurrences="12" value="_tu" /> + <ngram occurrences="12" value="_o" /> + <ngram occurrences="12" value="_non_" /> + <ngram occurrences="12" value="_l_" /> + <ngram occurrences="12" value="_gli_" /> + <ngram occurrences="12" value="_gli" /> + <ngram occurrences="12" value="_gl" /> + <ngram occurrences="12" value="_er" /> + <ngram occurrences="11" value="ul" /> + <ngram occurrences="11" value="pi" /> + <ngram occurrences="11" value="ome" /> + <ngram occurrences="11" value="o_i" /> + <ngram occurrences="11" value="o_e" /> + <ngram occurrences="11" value="o_di" /> + <ngram occurrences="11" value="l_p" /> + <ngram occurrences="11" value="ig" /> + <ngram occurrences="11" value="gn" /> + <ngram occurrences="11" value="fi" /> + <ngram occurrences="11" value="e_e" /> + <ngram occurrences="11" value="dd" /> + <ngram occurrences="11" value="cch" /> + <ngram occurrences="11" value="cas" /> + <ngram occurrences="11" value="ave" /> + <ngram occurrences="11" value="acc" /> + <ngram occurrences="11" value="a_v" /> + <ngram occurrences="11" value="a_ma" /> + <ngram occurrences="11" value="a_f" /> + <ngram occurrences="11" value="a_e_" /> + <ngram occurrences="11" value="a_co" /> + <ngram occurrences="11" value="_sa" /> + <ngram occurrences="11" value="_ri" /> + <ngram occurrences="11" value="_ne" /> + <ngram occurrences="11" value="_fa" /> + <ngram occurrences="11" value="_era" /> + <ngram occurrences="11" value="_da" /> + <ngram occurrences="11" value="_col" /> + <ngram occurrences="11" value="_cas" /> + <ngram occurrences="11" value="_ave" /> + <ngram occurrences="10" value="zi" /> + <ngram occurrences="10" value="rr" /> + <ngram occurrences="10" value="que" /> + <ngram occurrences="10" value="ome_" /> + <ngram occurrences="10" value="og" /> + <ngram occurrences="10" value="o_p" /> + <ngram occurrences="10" value="ndo_" /> + <ngram occurrences="10" value="n_c" /> + <ngram occurrences="10" value="man" /> + <ngram occurrences="10" value="ent" /> + <ngram occurrences="10" value="dell" /> + <ngram occurrences="10" value="cchi" /> + <ngram occurrences="10" value="casa_" /> + <ngram occurrences="10" value="casa" /> + <ngram occurrences="10" value="ato" /> + <ngram occurrences="10" value="asa_" /> + <ngram occurrences="10" value="asa" /> + <ngram occurrences="10" value="am" /> + <ngram occurrences="10" value="ale" /> + <ngram occurrences="10" value="a_di" /> + <ngram occurrences="10" value="_vo" /> + <ngram occurrences="10" value="_st" /> + <ngram occurrences="10" value="_que" /> + <ngram occurrences="10" value="_pa" /> + <ngram occurrences="10" value="_mo" /> + <ngram occurrences="10" value="_era_" /> + <ngram occurrences="10" value="_dell" /> + <ngram occurrences="10" value="_casa" /> + <ngram occurrences="10" value="_all" /> + <ngram occurrences="9" value="ó_" /> + <ngram occurrences="9" value="ó" /> + <ngram occurrences="9" value="van" /> + <ngram occurrences="9" value="uri" /> + <ngram occurrences="9" value="u_" /> + <ngram occurrences="9" value="sta" /> + <ngram occurrences="9" value="sse_" /> + <ngram occurrences="9" value="rid" /> + <ngram occurrences="9" value="par" /> + <ngram occurrences="9" value="ot" /> + <ngram occurrences="9" value="oi" /> + <ngram occurrences="9" value="o_di_" /> + <ngram occurrences="9" value="o_de" /> + <ngram occurrences="9" value="nda" /> + <ngram occurrences="9" value="iv" /> + <ngram occurrences="9" value="far" /> + <ngram occurrences="9" value="ess" /> + <ngram occurrences="9" value="e_n" /> + <ngram occurrences="9" value="e_i" /> + <ngram occurrences="9" value="del_" /> + <ngram occurrences="9" value="come_" /> + <ngram occurrences="9" value="come" /> + <ngram occurrences="9" value="bi" /> + <ngram occurrences="9" value="ato_" /> + <ngram occurrences="9" value="ando" /> + <ngram occurrences="9" value="anda" /> + <ngram occurrences="9" value="ale_" /> + <ngram occurrences="9" value="a_il_" /> + <ngram occurrences="9" value="a_il" /> + <ngram occurrences="9" value="_me" /> + <ngram occurrences="9" value="_le" /> + <ngram occurrences="9" value="_l_a" /> + <ngram occurrences="9" value="_del_" /> + <ngram occurrences="9" value="_come" /> + <ngram occurrences="9" value="_be" /> + <ngram occurrences="9" value="_an" /> + <ngram occurrences="8" value="vano_" /> + <ngram occurrences="8" value="vano" /> + <ngram occurrences="8" value="una_" /> + <ngram occurrences="8" value="una" /> + <ngram occurrences="8" value="uel" /> + <ngram occurrences="8" value="ser" /> + <ngram occurrences="8" value="ridd" /> + <ngram occurrences="8" value="ora" /> + <ngram occurrences="8" value="oi_" /> + <ngram occurrences="8" value="occ" /> + <ngram occurrences="8" value="o_l" /> + <ngram occurrences="8" value="o_e_" /> + <ngram occurrences="8" value="nz" /> + <ngram occurrences="8" value="n_ca" /> + <ngram occurrences="8" value="la_ma" /> + <ngram occurrences="8" value="la_c" /> + <ngram occurrences="8" value="ir" /> + <ngram occurrences="8" value="ina" /> + <ngram occurrences="8" value="idd" /> + <ngram occurrences="8" value="i_l" /> + <ngram occurrences="8" value="i_i" /> + <ngram occurrences="8" value="hi_" /> + <ngram occurrences="8" value="ene" /> + <ngram occurrences="8" value="e_pe" /> + <ngram occurrences="8" value="e_di" /> + <ngram occurrences="8" value="e_ch" /> +</ngrams> diff --git a/src/plugins/language/japanese-euc_jp.klp b/src/plugins/language/japanese-euc_jp.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1405" value="_" /> + <ngram occurrences="190" value="½" /> + <ngram occurrences="139" value="ë" /> + <ngram occurrences="131" value="_ë" /> + <ngram occurrences="110" value="¹" /> + <ngram occurrences="107" value="ê" /> + <ngram occurrences="107" value="_½" /> + <ngram occurrences="101" value="è" /> + <ngram occurrences="96" value="¸" /> + <ngram occurrences="96" value="ì" /> + <ngram occurrences="95" value="î" /> + <ngram occurrences="95" value="ë_" /> + <ngram occurrences="94" value="_ë_" /> + <ngram occurrences="87" value="½_" /> + <ngram occurrences="85" value="ç" /> + <ngram occurrences="85" value="_¹" /> + <ngram occurrences="83" value="í" /> + <ngram occurrences="81" value="á" /> + <ngram occurrences="76" value="æ" /> + <ngram occurrences="76" value="_è" /> + <ngram occurrences="75" value="è_" /> + <ngram occurrences="73" value="_î" /> + <ngram occurrences="72" value="_½_" /> + <ngram occurrences="68" value="ì_" /> + <ngram occurrences="67" value="_ê" /> + <ngram occurrences="66" value="ó" /> + <ngram occurrences="63" value="ã" /> + <ngram occurrences="63" value="_è_" /> + <ngram occurrences="60" value="µ" /> + <ngram occurrences="58" value="ä" /> + <ngram occurrences="57" value="ó_" /> + <ngram occurrences="57" value="ï" /> + <ngram occurrences="57" value="é" /> + <ngram occurrences="57" value="ç_" /> + <ngram occurrences="57" value="æ_" /> + <ngram occurrences="57" value="_ì" /> + <ngram occurrences="56" value="á_" /> + <ngram occurrences="56" value="_æ" /> + <ngram occurrences="55" value="_ó" /> + <ngram occurrences="53" value="ê_" /> + <ngram occurrences="53" value="µ_" /> + <ngram occurrences="52" value="â" /> + <ngram occurrences="51" value="¹_" /> + <ngram occurrences="51" value="_á" /> + <ngram occurrences="50" value="_ó_" /> + <ngram occurrences="50" value="_¹_" /> + <ngram occurrences="49" value="ã_" /> + <ngram occurrences="47" value="_¸" /> + <ngram occurrences="47" value="_ì_" /> + <ngram occurrences="47" value="_æ_" /> + <ngram occurrences="47" value="_µ" /> + <ngram occurrences="44" value="ï_" /> + <ngram occurrences="44" value="_ï" /> + <ngram occurrences="44" value="_ê_" /> + <ngram occurrences="44" value="_ç" /> + <ngram occurrences="44" value="_µ_" /> + <ngram occurrences="43" value="¸_" /> + <ngram occurrences="43" value="õ" /> + <ngram occurrences="42" value="ð" /> + <ngram occurrences="41" value="à" /> + <ngram occurrences="41" value="_ã" /> + <ngram occurrences="40" value="_á_" /> + <ngram occurrences="39" value="_ã_" /> + <ngram occurrences="38" value="í_" /> + <ngram occurrences="38" value="_é" /> + <ngram occurrences="37" value="ý" /> + <ngram occurrences="37" value="î_" /> + <ngram occurrences="37" value="å" /> + <ngram occurrences="36" value="ô" /> + <ngram occurrences="36" value="ò" /> + <ngram occurrences="36" value="_í" /> + <ngram occurrences="35" value="_ï_" /> + <ngram occurrences="34" value="õ_" /> + <ngram occurrences="34" value="é_" /> + <ngram occurrences="34" value="_ç_" /> + <ngram occurrences="32" value="ô_" /> + <ngram occurrences="32" value="ð_" /> + <ngram occurrences="31" value="_é_" /> + <ngram occurrences="30" value="ÿ" /> + <ngram occurrences="30" value="ø" /> + <ngram occurrences="30" value="³" /> + <ngram occurrences="29" value="â_" /> + <ngram occurrences="29" value="_ò" /> + <ngram occurrences="28" value="¨" /> + <ngram occurrences="28" value="þ" /> + <ngram occurrences="28" value="à_" /> + <ngram occurrences="28" value="_¸_" /> + <ngram occurrences="27" value="ö" /> + <ngram occurrences="27" value="_î_" /> + <ngram occurrences="25" value="¨_" /> + <ngram occurrences="25" value="¹_ë" /> + <ngram occurrences="25" value="_í_" /> + <ngram occurrences="25" value="_¹_ë" /> + <ngram occurrences="23" value="µ_ì" /> + <ngram occurrences="23" value="³_" /> + <ngram occurrences="23" value="_õ" /> + <ngram occurrences="23" value="_ä" /> + <ngram occurrences="23" value="_µ_ì" /> + <ngram occurrences="22" value="þ_" /> + <ngram occurrences="22" value="ñ" /> + <ngram occurrences="22" value="¹_ë_" /> + <ngram occurrences="22" value="µ_ì_" /> + <ngram occurrences="22" value="_¹_ë_" /> + <ngram occurrences="22" value="_µ_ì_" /> + <ngram occurrences="21" value="½ô" /> + <ngram occurrences="21" value="ý_" /> + <ngram occurrences="21" value="ä_" /> + <ngram occurrences="21" value="²" /> + <ngram occurrences="21" value="_õ_" /> + <ngram occurrences="21" value="_â" /> + <ngram occurrences="21" value="_³" /> + <ngram occurrences="20" value="½ô_" /> + <ngram occurrences="20" value="½_¸" /> + <ngram occurrences="20" value="ö_" /> + <ngram occurrences="20" value="ª" /> + <ngram occurrences="20" value="_½_¸" /> + <ngram occurrences="20" value="_³_" /> + <ngram occurrences="19" value="ü" /> + <ngram occurrences="19" value="ì_ë" /> + <ngram occurrences="19" value="á_ã_" /> + <ngram occurrences="19" value="á_ã" /> + <ngram occurrences="19" value="t" /> + <ngram occurrences="19" value="_ð_" /> + <ngram occurrences="19" value="_ð" /> + <ngram occurrences="18" value="µ_½" /> + <ngram occurrences="18" value="_¨" /> + <ngram occurrences="18" value="_á_ã_" /> + <ngram occurrences="18" value="_á_ã" /> + <ngram occurrences="17" value="ã_½_¸" /> + <ngram occurrences="17" value="ã_½_" /> + <ngram occurrences="17" value="ã_½" /> + <ngram occurrences="17" value="á_ã_½" /> + <ngram occurrences="17" value="_þ" /> + <ngram occurrences="17" value="_ä_" /> + <ngram occurrences="17" value="_ã_½_" /> + <ngram occurrences="17" value="_ã_½" /> + <ngram occurrences="17" value="_â_" /> + <ngram occurrences="16" value="½_ó_¹" /> + <ngram occurrences="16" value="½_ó_" /> + <ngram occurrences="16" value="½_ó" /> + <ngram occurrences="16" value="ó_¹" /> + <ngram occurrences="16" value="µ_½_ó" /> + <ngram occurrences="16" value="µ_½_" /> + <ngram occurrences="16" value="n" /> + <ngram occurrences="16" value="_¨_" /> + <ngram occurrences="16" value="_½_ó_" /> + <ngram occurrences="16" value="_½_ó" /> + <ngram occurrences="16" value="_þ_" /> + <ngram occurrences="16" value="_ó_¹" /> + <ngram occurrences="16" value="_ì_ë" /> + <ngram occurrences="16" value="_µ_½_" /> + <ngram occurrences="16" value="_µ_½" /> + <ngram occurrences="15" value="û" /> + <ngram occurrences="15" value="ë_è" /> + <ngram occurrences="15" value="ç_ë" /> + <ngram occurrences="15" value="ª_" /> + <ngram occurrences="15" value="i" /> + <ngram occurrences="15" value="_ë_è" /> + <ngram occurrences="14" value="ç_ë_" /> + <ngram occurrences="14" value="º" /> + <ngram occurrences="14" value="s" /> + <ngram occurrences="14" value="_à" /> + <ngram occurrences="13" value="½õ_" /> + <ngram occurrences="13" value="½õ" /> + <ngram occurrences="13" value="½_¸_" /> + <ngram occurrences="13" value="ø_" /> + <ngram occurrences="13" value="õ_½" /> + <ngram occurrences="13" value="ò_" /> + <ngram occurrences="13" value="íý" /> + <ngram occurrences="13" value="íñ" /> + <ngram occurrences="13" value="ë_è_" /> + <ngram occurrences="13" value="äì" /> + <ngram occurrences="13" value="d" /> + <ngram occurrences="13" value="_½_¸_" /> + <ngram occurrences="13" value="_ý" /> + <ngram occurrences="13" value="_ë_è_" /> + <ngram occurrences="12" value="é½" /> + <ngram occurrences="12" value="¹ç" /> + <ngram occurrences="12" value="a" /> + <ngram occurrences="12" value="_ø" /> + <ngram occurrences="12" value="_å" /> + <ngram occurrences="12" value="_²" /> + <ngram occurrences="12" value="_ª_" /> + <ngram occurrences="12" value="_ª" /> + <ngram occurrences="11" value="û_" /> + <ngram occurrences="11" value="ù" /> + <ngram occurrences="11" value="ì_ë_" /> + <ngram occurrences="11" value="æ_ë" /> + <ngram occurrences="11" value="ß" /> + <ngram occurrences="11" value="µ_ì_ë" /> + <ngram occurrences="11" value="_½ô_" /> + <ngram occurrences="11" value="_½ô" /> + <ngram occurrences="11" value="_ý_" /> + <ngram occurrences="10" value="½è" /> + <ngram occurrences="10" value="èí" /> + <ngram occurrences="10" value="äì_" /> + <ngram occurrences="10" value="äê" /> + <ngram occurrences="10" value="_ì_ë_" /> + <ngram occurrences="10" value="_ç_ë" /> + <ngram occurrences="10" value="_æ_ë" /> + <ngram occurrences="9" value="¸_¹" /> + <ngram occurrences="9" value="½¨_" /> + <ngram occurrences="9" value="½¨" /> + <ngram occurrences="9" value="ü_" /> + <ngram occurrences="9" value="ù_" /> + <ngram occurrences="9" value="øíñ" /> + <ngram occurrences="9" value="øí" /> + <ngram occurrences="9" value="íý_" /> + <ngram occurrences="9" value="íøíñ" /> + <ngram occurrences="9" value="íøí" /> + <ngram occurrences="9" value="íø" /> + <ngram occurrences="9" value="í_á" /> + <ngram occurrences="9" value="ë_á_" /> + <ngram occurrences="9" value="ë_á" /> + <ngram occurrences="9" value="çû" /> + <ngram occurrences="9" value="¹ç_" /> + <ngram occurrences="9" value="t_" /> + <ngram occurrences="9" value="_ô_" /> + <ngram occurrences="9" value="_ô" /> + <ngram occurrences="9" value="_ë_á_" /> + <ngram occurrences="9" value="_ë_á" /> + <ngram occurrences="9" value="_ç_ë_" /> + <ngram occurrences="8" value="¸_¹ð" /> + <ngram occurrences="8" value="½õ_½ô" /> + <ngram occurrences="8" value="½õ_½" /> + <ngram occurrences="8" value="½èíý_" /> + <ngram occurrences="8" value="½èíý" /> + <ngram occurrences="8" value="½èí" /> + <ngram occurrences="8" value="øíñ½ô" /> + <ngram occurrences="8" value="øíñ½" /> + <ngram occurrences="8" value="õ_½ô_" /> + <ngram occurrences="8" value="õ_½ô" /> + <ngram occurrences="8" value="ñ½ô_" /> + <ngram occurrences="8" value="ñ½ô" /> + <ngram occurrences="8" value="ñ½" /> + <ngram occurrences="8" value="íøíñ½" /> + <ngram occurrences="8" value="íñ½ô_" /> + <ngram occurrences="8" value="íñ½ô" /> + <ngram occurrences="8" value="íñ½" /> + <ngram occurrences="8" value="í_áç_" /> + <ngram occurrences="8" value="í_áç" /> + <ngram occurrences="8" value="ë_½" /> + <ngram occurrences="8" value="êý" /> + <ngram occurrences="8" value="ê_ë" /> + <ngram occurrences="8" value="èíý_" /> + <ngram occurrences="8" value="èíý" /> + <ngram occurrences="8" value="è_ó" /> + <ngram occurrences="8" value="ç½" /> + <ngram occurrences="8" value="æ_ë_" /> + <ngram occurrences="8" value="å_" /> + <ngram occurrences="8" value="áç_" /> + <ngram occurrences="8" value="áç" /> + <ngram occurrences="8" value="¹ð" /> + <ngram occurrences="8" value="¹í" /> + <ngram occurrences="8" value="o" /> + <ngram occurrences="8" value="_ò_" /> + <ngram occurrences="8" value="_ë_½" /> + <ngram occurrences="8" value="_è_ó" /> + <ngram occurrences="8" value="_áç_" /> + <ngram occurrences="8" value="_áç" /> + <ngram occurrences="8" value="_¹ð" /> + <ngram occurrences="7" value="¸ä" /> + <ngram occurrences="7" value="ÿ_" /> + <ngram occurrences="7" value="ó_è" /> + <ngram occurrences="7" value="ó_¹í_" /> + <ngram occurrences="7" value="ó_¹í" /> + <ngram occurrences="7" value="ñ_" /> + <ngram occurrences="7" value="ë¸" /> + <ngram occurrences="7" value="ë_½_" /> + <ngram occurrences="7" value="ê_¹_" /> + <ngram occurrences="7" value="ê_¹" /> + <ngram occurrences="7" value="é_ì_" /> + <ngram occurrences="7" value="é_ì" /> + <ngram occurrences="7" value="è_î" /> + <ngram occurrences="7" value="ç_½" /> + <ngram occurrences="7" value="ç_ï" /> + <ngram occurrences="7" value="ç_î" /> + <ngram occurrences="7" value="äê_" /> + <ngram occurrences="7" value="á_ë" /> + <ngram occurrences="7" value="º_" /> + <ngram occurrences="7" value="¹í_áç" /> + <ngram occurrences="7" value="¹í_á" /> + <ngram occurrences="7" value="¹í_" /> + <ngram occurrences="7" value="r" /> + <ngram occurrences="7" value="_ÿ" /> + <ngram occurrences="7" value="_ü" /> + <ngram occurrences="7" value="_ù" /> + <ngram occurrences="7" value="_ø_" /> + <ngram occurrences="7" value="_ó_¹í" /> + <ngram occurrences="7" value="_ë¸" /> + <ngram occurrences="7" value="_ë_½_" /> + <ngram occurrences="7" value="_ê_ë" /> + <ngram occurrences="7" value="_é_ì_" /> + <ngram occurrences="7" value="_é_ì" /> + <ngram occurrences="7" value="_æ_ë_" /> + <ngram occurrences="7" value="_å_" /> + <ngram occurrences="7" value="_à_" /> + <ngram occurrences="7" value="_ß" /> + <ngram occurrences="7" value="_º" /> + <ngram occurrences="7" value="_¹í_á" /> + <ngram occurrences="7" value="_¹í_" /> + <ngram occurrences="7" value="_¹í" /> + <ngram occurrences="6" value="¸_ë" /> + <ngram occurrences="6" value="¸_¹ð_" /> + <ngram occurrences="6" value="½½¨_" /> + <ngram occurrences="6" value="½½¨" /> + <ngram occurrences="6" value="½½" /> + <ngram occurrences="6" value="½ç" /> + <ngram occurrences="6" value="½à" /> + <ngram occurrences="6" value="½_è" /> + <ngram occurrences="6" value="ÿõâö" /> + <ngram occurrences="6" value="ÿõâ" /> + <ngram occurrences="6" value="ÿõ" /> + <ngram occurrences="6" value="õâö" /> + <ngram occurrences="6" value="õâ" /> + <ngram occurrences="6" value="õ_á_" /> + <ngram occurrences="6" value="õ_á" /> + <ngram occurrences="6" value="ó_æ_" /> + <ngram occurrences="6" value="ó_æ" /> + <ngram occurrences="6" value="ó_¹_" /> + <ngram occurrences="6" value="î½" /> + <ngram occurrences="6" value="í_è" /> + <ngram occurrences="6" value="í_µ" /> + <ngram occurrences="6" value="ì_½" /> + <ngram occurrences="6" value="ì_æ" /> + <ngram occurrences="6" value="ì_¹" /> + <ngram occurrences="6" value="ë_ç" /> + <ngram occurrences="6" value="êì" /> + <ngram occurrences="6" value="é½½¨_" /> + <ngram occurrences="6" value="é½½¨" /> + <ngram occurrences="6" value="é½½" /> + <ngram occurrences="6" value="é_ð_" /> + <ngram occurrences="6" value="é_ð" /> + <ngram occurrences="6" value="ç_¸_" /> + <ngram occurrences="6" value="ç_¸" /> + <ngram occurrences="6" value="ç_ï_" /> + <ngram occurrences="6" value="âö" /> + <ngram occurrences="6" value="ß_" /> + <ngram occurrences="6" value="¹½" /> + <ngram occurrences="6" value="¹ð_" /> + <ngram occurrences="6" value="¹_è_" /> + <ngram occurrences="6" value="¹_è" /> + <ngram occurrences="6" value="µ_æ_" /> + <ngram occurrences="6" value="µ_æ" /> + <ngram occurrences="6" value="³_î" /> + <ngram occurrences="6" value="u" /> + <ngram occurrences="6" value="g" /> + <ngram occurrences="6" value="_½è" /> + <ngram occurrences="6" value="_ù_" /> + <ngram occurrences="6" value="_ö" /> + <ngram occurrences="6" value="_õ_á_" /> + <ngram occurrences="6" value="_õ_á" /> + <ngram occurrences="6" value="_ó_è" /> + <ngram occurrences="6" value="_ó_æ_" /> + <ngram occurrences="6" value="_ó_æ" /> + <ngram occurrences="6" value="_ó_¹_" /> + <ngram occurrences="6" value="_î½" /> + <ngram occurrences="6" value="_ë_ç" /> + <ngram occurrences="6" value="_é_ð_" /> + <ngram occurrences="6" value="_é_ð" /> + <ngram occurrences="6" value="_è_î" /> + <ngram occurrences="6" value="_¹ð_" /> + <ngram occurrences="6" value="_¹_è_" /> + <ngram occurrences="6" value="_¹_è" /> + <ngram occurrences="5" value="¸½" /> + <ngram occurrences="5" value="¸ø" /> + <ngram occurrences="5" value="¸ö" /> + <ngram occurrences="5" value="¸äì_½" /> + <ngram occurrences="5" value="¸äì_" /> + <ngram occurrences="5" value="¸äì" /> + <ngram occurrences="5" value="¸_ë_" /> + <ngram occurrences="5" value="½ê" /> + <ngram occurrences="5" value="½à_" /> + <ngram occurrences="5" value="½_¸äì" /> + <ngram occurrences="5" value="½_¸ä" /> + <ngram occurrences="5" value="½_ð_ã" /> + <ngram occurrences="5" value="½_ð_" /> + <ngram occurrences="5" value="½_ð" /> + <ngram occurrences="5" value="½_î" /> + <ngram occurrences="5" value="ý¸" /> + <ngram occurrences="5" value="ý_ó_" /> + <ngram occurrences="5" value="ý_ó" /> + <ngram occurrences="5" value="û_ê_" /> + <ngram occurrences="5" value="û_ê" /> + <ngram occurrences="5" value="ú" /> + <ngram occurrences="5" value="øäê_" /> + <ngram occurrences="5" value="øäê" /> + <ngram occurrences="5" value="øä" /> + <ngram occurrences="5" value="õ_½_" /> + <ngram occurrences="5" value="ô_î" /> + <ngram occurrences="5" value="ó_è_" /> + <ngram occurrences="5" value="ð_í_" /> + <ngram occurrences="5" value="ð_í" /> + <ngram occurrences="5" value="ð_æ" /> + <ngram occurrences="5" value="ð_ã_" /> + <ngram occurrences="5" value="ð_ã" /> + <ngram occurrences="5" value="ï_½" /> + <ngram occurrences="5" value="ï_ê" /> + <ngram occurrences="5" value="í_è_" /> + <ngram occurrences="5" value="ì_½èí" /> +</ngrams> diff --git a/src/plugins/language/japanese-shift_jis.klp b/src/plugins/language/japanese-shift_jis.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1870" value="_" /> + <ngram occurrences="112" value="ì_" /> + <ngram occurrences="112" value="ì" /> + <ngram occurrences="112" value="_ì_" /> + <ngram occurrences="112" value="_ì" /> + <ngram occurrences="106" value="é_" /> + <ngram occurrences="106" value="é" /> + <ngram occurrences="106" value="_é_" /> + <ngram occurrences="106" value="_é" /> + <ngram occurrences="96" value="a_" /> + <ngram occurrences="96" value="a" /> + <ngram occurrences="96" value="_a_" /> + <ngram occurrences="96" value="_a" /> + <ngram occurrences="92" value="è_" /> + <ngram occurrences="92" value="è" /> + <ngram occurrences="92" value="_è_" /> + <ngram occurrences="92" value="_è" /> + <ngram occurrences="85" value="æ_" /> + <ngram occurrences="85" value="æ" /> + <ngram occurrences="85" value="_æ_" /> + <ngram occurrences="85" value="_æ" /> + <ngram occurrences="73" value="ð_" /> + <ngram occurrences="73" value="ð" /> + <ngram occurrences="73" value="_ð_" /> + <ngram occurrences="73" value="_ð" /> + <ngram occurrences="67" value="½_" /> + <ngram occurrences="67" value="½" /> + <ngram occurrences="67" value="å_" /> + <ngram occurrences="67" value="å" /> + <ngram occurrences="67" value="_½_" /> + <ngram occurrences="67" value="_½" /> + <ngram occurrences="67" value="_å_" /> + <ngram occurrences="67" value="_å" /> + <ngram occurrences="55" value="í_" /> + <ngram occurrences="55" value="í" /> + <ngram occurrences="55" value="ä_" /> + <ngram occurrences="55" value="ä" /> + <ngram occurrences="55" value="_í_" /> + <ngram occurrences="55" value="_í" /> + <ngram occurrences="55" value="_ä_" /> + <ngram occurrences="55" value="_ä" /> + <ngram occurrences="52" value="µ_" /> + <ngram occurrences="52" value="µ" /> + <ngram occurrences="52" value="b_" /> + <ngram occurrences="52" value="b" /> + <ngram occurrences="52" value="_µ_" /> + <ngram occurrences="52" value="_µ" /> + <ngram occurrences="52" value="_b_" /> + <ngram occurrences="52" value="_b" /> + <ngram occurrences="48" value="ç_" /> + <ngram occurrences="48" value="ç" /> + <ngram occurrences="48" value="_ç_" /> + <ngram occurrences="48" value="_ç" /> + <ngram occurrences="47" value="ü_" /> + <ngram occurrences="47" value="ü" /> + <ngram occurrences="47" value="à_" /> + <ngram occurrences="47" value="à" /> + <ngram occurrences="47" value="_ü_" /> + <ngram occurrences="47" value="_ü" /> + <ngram occurrences="47" value="_à_" /> + <ngram occurrences="47" value="_à" /> + <ngram occurrences="43" value="v_" /> + <ngram occurrences="43" value="v" /> + <ngram occurrences="43" value="_v_" /> + <ngram occurrences="43" value="_v" /> + <ngram occurrences="41" value="ª_" /> + <ngram occurrences="41" value="ª" /> + <ngram occurrences="41" value="_ª_" /> + <ngram occurrences="41" value="_ª" /> + <ngram occurrences="36" value="n_" /> + <ngram occurrences="36" value="n" /> + <ngram occurrences="36" value="_n_" /> + <ngram occurrences="36" value="_n" /> + <ngram occurrences="34" value="ê_" /> + <ngram occurrences="34" value="ê" /> + <ngram occurrences="34" value="_ê_" /> + <ngram occurrences="34" value="_ê" /> + <ngram occurrences="30" value="i_" /> + <ngram occurrences="30" value="i" /> + <ngram occurrences="30" value="_i_" /> + <ngram occurrences="30" value="_i" /> + <ngram occurrences="28" value="x_" /> + <ngram occurrences="28" value="x" /> + <ngram occurrences="28" value="_x_" /> + <ngram occurrences="28" value="_x" /> + <ngram occurrences="27" value="á_" /> + <ngram occurrences="27" value="á" /> + <ngram occurrences="27" value="_á_" /> + <ngram occurrences="27" value="_á" /> + <ngram occurrences="26" value="û_" /> + <ngram occurrences="26" value="û" /> + <ngram occurrences="26" value="w_" /> + <ngram occurrences="26" value="w" /> + <ngram occurrences="26" value="_û_" /> + <ngram occurrences="26" value="_û" /> + <ngram occurrences="26" value="_w_" /> + <ngram occurrences="26" value="_w" /> + <ngram occurrences="25" value="p_" /> + <ngram occurrences="25" value="p" /> + <ngram occurrences="25" value="_p_" /> + <ngram occurrences="25" value="_p" /> + <ngram occurrences="23" value="s_" /> + <ngram occurrences="23" value="s" /> + <ngram occurrences="23" value="_s_" /> + <ngram occurrences="23" value="_s" /> + <ngram occurrences="21" value="ñ_" /> + <ngram occurrences="21" value="ñ" /> + <ngram occurrences="21" value="o_" /> + <ngram occurrences="21" value="o" /> + <ngram occurrences="21" value="_ñ_" /> + <ngram occurrences="21" value="_ñ" /> + <ngram occurrences="21" value="_o_" /> + <ngram occurrences="21" value="_o" /> + <ngram occurrences="20" value="µ_ä_" /> + <ngram occurrences="20" value="µ_ä" /> + <ngram occurrences="20" value="_µ_ä_" /> + <ngram occurrences="20" value="_µ_ä" /> + <ngram occurrences="18" value="â_" /> + <ngram occurrences="18" value="â" /> + <ngram occurrences="18" value="_â_" /> + <ngram occurrences="18" value="_â" /> + <ngram occurrences="17" value="ß_" /> + <ngram occurrences="17" value="ß" /> + <ngram occurrences="17" value="³_" /> + <ngram occurrences="17" value="³" /> + <ngram occurrences="17" value="z_" /> + <ngram occurrences="17" value="z" /> + <ngram occurrences="17" value="l_" /> + <ngram occurrences="17" value="l" /> + <ngram occurrences="17" value="j_" /> + <ngram occurrences="17" value="j" /> + <ngram occurrences="17" value="_ß_" /> + <ngram occurrences="17" value="_ß" /> + <ngram occurrences="17" value="_³_" /> + <ngram occurrences="17" value="_³" /> + <ngram occurrences="17" value="_z_" /> + <ngram occurrences="17" value="_z" /> + <ngram occurrences="17" value="_l_" /> + <ngram occurrences="17" value="_l" /> + <ngram occurrences="17" value="_j_" /> + <ngram occurrences="17" value="_j" /> + <ngram occurrences="16" value="¨_" /> + <ngram occurrences="16" value="¨" /> + <ngram occurrences="16" value="ÿ_" /> + <ngram occurrences="16" value="ÿ" /> + <ngram occurrences="16" value="é_æ_" /> + <ngram occurrences="16" value="é_æ" /> + <ngram occurrences="16" value="u_" /> + <ngram occurrences="16" value="u" /> + <ngram occurrences="16" value="_¨_" /> + <ngram occurrences="16" value="_¨" /> + <ngram occurrences="16" value="_ÿ_" /> + <ngram occurrences="16" value="_ÿ" /> + <ngram occurrences="16" value="_é_æ_" /> + <ngram occurrences="16" value="_é_æ" /> + <ngram occurrences="16" value="_u_" /> + <ngram occurrences="16" value="_u" /> + <ngram occurrences="15" value="ï_" /> + <ngram occurrences="15" value="ï" /> + <ngram occurrences="15" value="r_" /> + <ngram occurrences="15" value="r" /> + <ngram occurrences="15" value="q_" /> + <ngram occurrences="15" value="q" /> + <ngram occurrences="15" value="_ï_" /> + <ngram occurrences="15" value="_ï" /> + <ngram occurrences="15" value="_r_" /> + <ngram occurrences="15" value="_r" /> + <ngram occurrences="15" value="_q_" /> + <ngram occurrences="15" value="_q" /> + <ngram occurrences="14" value="ü_b_" /> + <ngram occurrences="14" value="ü_b" /> + <ngram occurrences="14" value="g_" /> + <ngram occurrences="14" value="g" /> + <ngram occurrences="14" value="_ü_b_" /> + <ngram occurrences="14" value="_ü_b" /> + <ngram occurrences="14" value="_g_" /> + <ngram occurrences="14" value="_g" /> + <ngram occurrences="13" value="ú_" /> + <ngram occurrences="13" value="ú" /> + <ngram occurrences="13" value="_ú_" /> + <ngram occurrences="13" value="_ú" /> + <ngram occurrences="12" value="¸_" /> + <ngram occurrences="12" value="¸" /> + <ngram occurrences="12" value="½_b_" /> + <ngram occurrences="12" value="½_b" /> + <ngram occurrences="12" value="µ_½_" /> + <ngram occurrences="12" value="µ_½" /> + <ngram occurrences="12" value="t_" /> + <ngram occurrences="12" value="t" /> + <ngram occurrences="12" value="h_" /> + <ngram occurrences="12" value="h" /> + <ngram occurrences="12" value="c_" /> + <ngram occurrences="12" value="c" /> + <ngram occurrences="12" value="_¸_" /> + <ngram occurrences="12" value="_¸" /> + <ngram occurrences="12" value="_½_b_" /> + <ngram occurrences="12" value="_½_b" /> + <ngram occurrences="12" value="_µ_½_" /> + <ngram occurrences="12" value="_µ_½" /> + <ngram occurrences="12" value="_t_" /> + <ngram occurrences="12" value="_t" /> + <ngram occurrences="12" value="_h_" /> + <ngram occurrences="12" value="_h" /> + <ngram occurrences="12" value="_c_" /> + <ngram occurrences="12" value="_c" /> + <ngram occurrences="11" value="ã_" /> + <ngram occurrences="11" value="ã" /> + <ngram occurrences="11" value="¹_" /> + <ngram occurrences="11" value="¹" /> + <ngram occurrences="11" value="k_" /> + <ngram occurrences="11" value="k" /> + <ngram occurrences="11" value="d_" /> + <ngram occurrences="11" value="d" /> + <ngram occurrences="11" value="_ã_" /> + <ngram occurrences="11" value="_ã" /> + <ngram occurrences="11" value="_¹_" /> + <ngram occurrences="11" value="_¹" /> + <ngram occurrences="11" value="_k_" /> + <ngram occurrences="11" value="_k" /> + <ngram occurrences="11" value="_d_" /> + <ngram occurrences="11" value="_d" /> + <ngram occurrences="10" value="î_" /> + <ngram occurrences="10" value="î" /> + <ngram occurrences="10" value="ë_" /> + <ngram occurrences="10" value="ë" /> + <ngram occurrences="10" value="è_ü_" /> + <ngram occurrences="10" value="è_ü" /> + <ngram occurrences="10" value="æ_ì_" /> + <ngram occurrences="10" value="æ_ì" /> + <ngram occurrences="10" value="å_é_" /> + <ngram occurrences="10" value="å_é" /> + <ngram occurrences="10" value="ä_a_" /> + <ngram occurrences="10" value="ä_a" /> + <ngram occurrences="10" value="y_" /> + <ngram occurrences="10" value="y" /> + <ngram occurrences="10" value="_î_" /> + <ngram occurrences="10" value="_î" /> + <ngram occurrences="10" value="_ë_" /> + <ngram occurrences="10" value="_ë" /> + <ngram occurrences="10" value="_è_ü_" /> + <ngram occurrences="10" value="_è_ü" /> + <ngram occurrences="10" value="_æ_ì_" /> + <ngram occurrences="10" value="_æ_ì" /> + <ngram occurrences="10" value="_å_é_" /> + <ngram occurrences="10" value="_å_é" /> + <ngram occurrences="10" value="_ä_a_" /> + <ngram occurrences="10" value="_ä_a" /> + <ngram occurrences="10" value="_y_" /> + <ngram occurrences="10" value="_y" /> + <ngram occurrences="10" value="__" /> + <ngram occurrences="9" value="ý_" /> + <ngram occurrences="9" value="ý" /> + <ngram occurrences="9" value="ü_v_" /> + <ngram occurrences="9" value="ü_v" /> + <ngram occurrences="9" value="í_a_" /> + <ngram occurrences="9" value="í_a" /> + <ngram occurrences="9" value="á_½_" /> + <ngram occurrences="9" value="á_½" /> + <ngram occurrences="9" value="á_ä_" /> + <ngram occurrences="9" value="á_ä" /> + <ngram occurrences="9" value="º_" /> + <ngram occurrences="9" value="º" /> + <ngram occurrences="9" value="e_" /> + <ngram occurrences="9" value="e" /> + <ngram occurrences="9" value="a_ì_" /> + <ngram occurrences="9" value="a_ì" /> + <ngram occurrences="9" value="_ý_" /> + <ngram occurrences="9" value="_ý" /> + <ngram occurrences="9" value="_ü_v_" /> + <ngram occurrences="9" value="_ü_v" /> + <ngram occurrences="9" value="_í_a_" /> + <ngram occurrences="9" value="_í_a" /> + <ngram occurrences="9" value="_á_½_" /> + <ngram occurrences="9" value="_á_½" /> + <ngram occurrences="9" value="_á_ä_" /> + <ngram occurrences="9" value="_á_ä" /> + <ngram occurrences="9" value="_º_" /> + <ngram occurrences="9" value="_º" /> + <ngram occurrences="9" value="_e_" /> + <ngram occurrences="9" value="_e" /> + <ngram occurrences="9" value="_a_ì_" /> + <ngram occurrences="9" value="_a_ì" /> + <ngram occurrences="8" value="ø_" /> + <ngram occurrences="8" value="ø" /> + <ngram occurrences="8" value="ö_" /> + <ngram occurrences="8" value="ö" /> + <ngram occurrences="8" value="é_a_" /> + <ngram occurrences="8" value="é_a" /> + <ngram occurrences="8" value="è_è_" /> + <ngram occurrences="8" value="è_è" /> + <ngram occurrences="8" value="v_æ_" /> + <ngram occurrences="8" value="v_æ" /> + <ngram occurrences="8" value="_ø_" /> + <ngram occurrences="8" value="_ø" /> + <ngram occurrences="8" value="_ö_" /> + <ngram occurrences="8" value="_ö" /> + <ngram occurrences="8" value="_é_a_" /> + <ngram occurrences="8" value="_é_a" /> + <ngram occurrences="8" value="_è_è_" /> + <ngram occurrences="8" value="_è_è" /> + <ngram occurrences="8" value="_v_æ_" /> + <ngram occurrences="8" value="_v_æ" /> + <ngram occurrences="7" value="ì_ì_" /> + <ngram occurrences="7" value="ì_ì" /> + <ngram occurrences="7" value="é_à_" /> + <ngram occurrences="7" value="é_à" /> + <ngram occurrences="7" value="æ_é_" /> + <ngram occurrences="7" value="æ_é" /> + <ngram occurrences="7" value="æ_µ_" /> + <ngram occurrences="7" value="æ_µ" /> + <ngram occurrences="7" value="µ_ä_a" /> + <ngram occurrences="7" value="n_û_" /> + <ngram occurrences="7" value="n_û" /> + <ngram occurrences="7" value="_ì_ì_" /> + <ngram occurrences="7" value="_ì_ì" /> + <ngram occurrences="7" value="_é_à_" /> + <ngram occurrences="7" value="_é_à" /> + <ngram occurrences="7" value="_æ_é_" /> + <ngram occurrences="7" value="_æ_é" /> + <ngram occurrences="7" value="_æ_µ_" /> + <ngram occurrences="7" value="_æ_µ" /> + <ngram occurrences="7" value="_n_û_" /> + <ngram occurrences="7" value="_n_û" /> + <ngram occurrences="6" value="ù_" /> + <ngram occurrences="6" value="ù" /> + <ngram occurrences="6" value="ó_" /> + <ngram occurrences="6" value="ó" /> + <ngram occurrences="6" value="é_í_" /> + <ngram occurrences="6" value="é_í" /> + <ngram occurrences="6" value="é_b_" /> + <ngram occurrences="6" value="é_b" /> + <ngram occurrences="6" value="è_ü_b" /> + <ngram occurrences="6" value="æ_è_" /> + <ngram occurrences="6" value="æ_è" /> + <ngram occurrences="6" value="æ_æ_" /> + <ngram occurrences="6" value="æ_æ" /> + <ngram occurrences="6" value="æ_à_" /> + <ngram occurrences="6" value="æ_à" /> + <ngram occurrences="6" value="æ_µ_ä" /> + <ngram occurrences="6" value="å_à_" /> + <ngram occurrences="6" value="å_à" /> + <ngram occurrences="6" value="å_a_" /> + <ngram occurrences="6" value="å_a" /> + <ngram occurrences="6" value="ä_½_" /> + <ngram occurrences="6" value="ä_½" /> + <ngram occurrences="6" value="à_è_" /> + <ngram occurrences="6" value="à_è" /> + <ngram occurrences="6" value="ß_é_" /> + <ngram occurrences="6" value="ß_é" /> + <ngram occurrences="6" value="²_" /> + <ngram occurrences="6" value="²" /> + <ngram occurrences="6" value="ª_a_" /> + <ngram occurrences="6" value="ª_a" /> + <ngram occurrences="6" value="i_è_" /> + <ngram occurrences="6" value="i_è" /> + <ngram occurrences="6" value="_ù_" /> + <ngram occurrences="6" value="_ù" /> + <ngram occurrences="6" value="_ó_" /> + <ngram occurrences="6" value="_ó" /> + <ngram occurrences="6" value="_é_í_" /> + <ngram occurrences="6" value="_é_í" /> + <ngram occurrences="6" value="_é_b_" /> + <ngram occurrences="6" value="_é_b" /> + <ngram occurrences="6" value="_æ_è_" /> + <ngram occurrences="6" value="_æ_è" /> + <ngram occurrences="6" value="_æ_æ_" /> + <ngram occurrences="6" value="_æ_æ" /> + <ngram occurrences="6" value="_æ_à_" /> + <ngram occurrences="6" value="_æ_à" /> + <ngram occurrences="6" value="_å_à_" /> + <ngram occurrences="6" value="_å_à" /> + <ngram occurrences="6" value="_å_a_" /> + <ngram occurrences="6" value="_å_a" /> + <ngram occurrences="6" value="_ä_½_" /> + <ngram occurrences="6" value="_ä_½" /> + <ngram occurrences="6" value="_à_è_" /> + <ngram occurrences="6" value="_à_è" /> + <ngram occurrences="6" value="_ß_é_" /> + <ngram occurrences="6" value="_ß_é" /> + <ngram occurrences="6" value="_²_" /> + <ngram occurrences="6" value="_²" /> + <ngram occurrences="6" value="_ª_a_" /> + <ngram occurrences="6" value="_ª_a" /> + <ngram occurrences="6" value="_i_è_" /> + <ngram occurrences="6" value="_i_è" /> + <ngram occurrences="5" value="½_è_" /> + <ngram occurrences="5" value="½_è" /> + <ngram occurrences="5" value="½_µ_" /> + <ngram occurrences="5" value="½_µ" /> + <ngram occurrences="5" value="û_ª_" /> + <ngram occurrences="5" value="û_ª" /> + <ngram occurrences="5" value="õ_" /> + <ngram occurrences="5" value="õ" /> + <ngram occurrences="5" value="ô_" /> + <ngram occurrences="5" value="ô" /> + <ngram occurrences="5" value="ð_µ_" /> + <ngram occurrences="5" value="ð_µ" /> + <ngram occurrences="5" value="ì_é_" /> + <ngram occurrences="5" value="ì_é" /> + <ngram occurrences="5" value="ì_å_" /> +</ngrams> diff --git a/src/plugins/language/katlanguagemanager.cpp b/src/plugins/language/katlanguagemanager.cpp @@ -0,0 +1,310 @@ +/*************************************************************************** + * Copyright (C) 2005 by Roberto Cappuccio and the Kat team * + * Roberto Cappuccio : roberto.cappuccio@gmail.com * + * * + * This program is free software; you can redistribute it and/or modify * + * it under the terms of the GNU General Public License as published by * + * the Free Software Foundation; either version 2 of the License, or * + * (at your option) any later version. * + * * + * This program is distributed in the hope that it will be useful, * + * but WITHOUT ANY WARRANTY; without even the implied warranty of * + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * + * GNU General Public License for more details. * + * * + * You should have received a copy of the GNU General Public License * + * along with this program; if not, write to the * + * Free Software Foundation, Inc., * + * 51 Franklin Steet, Fifth Floor, Boston, MA 02110-1301, USA. * + ***************************************************************************/ + +#include <cstdlib> +#include <kdebug.h> +#include <kstandarddirs.h> +#include <kio/job.h> +#include <kio/jobclasses.h> +#include <qregexp.h> +#include <qdir.h> +#include <qdom.h> + +#include "katlanguagemanager.h" + +int NGramsList::compareItems( QCollection::Item item1, QCollection::Item item2 ) +{ + NGram* n1 = (NGram*)item1; + NGram* n2 = (NGram*)item2; + + return n2->occurrences - n1->occurrences; +} + +int LanguageList::compareItems( QCollection::Item item1, QCollection::Item item2 ) +{ + Language* n1 = (Language*)item1; + Language* n2 = (Language*)item2; + + return n2->distance - n1->distance; +} + +KatLanguageManager::KatLanguageManager() +{ +} + +KatLanguageManager::~KatLanguageManager() +{ +} + +void KatLanguageManager::extractNGrams( const QString& str, QStringList& ngrams, int size ) +{ + QString paddedString( str ); + + paddedString = paddedString.replace( QRegExp( " " ), "_" ); + paddedString = '_' + paddedString + '_'; + + for( int i = 0; i < paddedString.length() - size + 1; i++ ) + ngrams.append( paddedString.mid( i, size ) ); +} + +NGramsList KatLanguageManager::createFingerprintFromFile( const QString& fileName ) +{ + QFile m_file( fileName ); + QTextStream m_stream( &m_file ); + bool m_open = m_file.open( IO_ReadOnly ); + QString buffer = m_stream.read(); + m_file.close(); + + buffer = buffer.lower(); + buffer = buffer.replace( QRegExp( "[\\W]" ), " " ); + buffer = buffer.replace( QRegExp( "[0-9]" ), " " ); + buffer = buffer.simplifyWhiteSpace(); + + return createFingerprintFromQString( buffer ); +} + +NGramsList KatLanguageManager::createFingerprintFromQString( const QString& buf ) +{ + QStringList ngrams; + NGramsList wngrams; + + wngrams.setAutoDelete( true ); + + QString buffer( buf ); + buffer.truncate( MAXDOCSIZE ); // only use the first MAXDOCSIZE characters of the buffer + + // extract the ngrams + for ( int size = 1; size <= MAXNGRAMSIZE; ++size ) + extractNGrams( buffer, ngrams, size ); + + // sort the ngrams + ngrams.sort(); + + // count the occurrences of every ngram + // and build the NGramList wngrams + long occurrences; + QStringList::Iterator ngram = ngrams.begin(); + while ( ngram != ngrams.end() ) + { + QString currentNGram = *ngram; + + ngram++; + + occurrences = 1; + while ( *ngram == currentNGram ) + { + occurrences++; + ngram++; + } + + wngrams.inSort( new NGram( currentNGram, occurrences ) ); + } + + // the profile has to contain a maximum of MAXNGRAMS + while ( wngrams.count() > MAXNGRAMS ) + wngrams.removeLast(); + + return wngrams; +} + +QString KatLanguageManager::identifyLanguage( const QString& buffer, LanguageProfileMap lp ) +{ + long distance; + long minscore = MAXSCORE; + long threshold = minscore; + LanguageList language_list; + language_list.setAutoDelete( true ); + LanguageList candidates; + candidates.setAutoDelete( true ); + + // create the fingerprint of the buffer + NGramsList file_ngrams = createFingerprintFromQString( buffer ); + if ( buffer.length() < MINDOCSIZE ) + return QString( "unknown" ); + + // cycle through the list of managed languages + // and build an ordered list of languages sorted by distance + QMap<QString,LanguageProfile>::Iterator end( lp.end() ); + for ( QMap<QString,LanguageProfile>::Iterator it = lp.begin(); it != end; ++it ) + { + QString lname = it.key(); + LanguageProfile language_ngrams = (LanguageProfile)it.data(); + + // calculate the distance between the file profile and the language profile + distance = calculateDistance( file_ngrams, language_ngrams ); + + // calculate the threshold + if ( distance < minscore ) + { + minscore = distance; + threshold = (long)( (double)distance * THRESHOLDVALUE ); + } + + language_list.inSort( new Language( lname, distance ) ); + } + + // now that the list of languages is sorted by distance + // extract at most MAXCANDIDATES candidates + int cnt = 0; + Language* currentLanguage; + QPtrList<Language>::Iterator language = language_list.begin(); + while ( language != language_list.end() ) + { + currentLanguage = *language; + + if ( currentLanguage->distance <= threshold ) + { + cnt++; + if ( cnt == MAXCANDIDATES + 1 ) + break; + + candidates.inSort( new Language( currentLanguage->language, currentLanguage->distance ) ); + } + + language++; + } + + // If more than MAXCANDIDATES matches are found within the threshold, + // the classifier reports unknown, because the input is obviously confusing + if ( cnt == MAXCANDIDATES + 1 ) { + return QString( "unknown" ); + } else { + Language* first = candidates.getFirst(); + if ( first != 0L ) + return QString( first->language ); + else + return QString( "unknown" ); + } +} + +long KatLanguageManager::calculateDistance( NGramsList& file_ngrams, LanguageProfile& langNG ) +{ + long fileNGPos = 0L; + long langNGPos = 0L; + long distance = 0L; + + NGramsList::Iterator file_ngram = file_ngrams.begin(); + while ( file_ngram != file_ngrams.end() ) + { + NGram* currentFileNGram = *file_ngram; + + // search the currentFileNGram in language_ngrams + // and calculate the distance + QMap<QString, long>::iterator ng = langNG.find( currentFileNGram->ngram ); + + if ( ng == langNG.end() ) + { + // not found + distance = distance + MAXOUTOFPLACE; + } + else + { + //found + langNGPos = ng.data(); + distance = distance + labs( langNGPos - fileNGPos ); + } + + fileNGPos++; + file_ngram++; + } + + return distance; +} + +LanguageProfileMap* KatLanguageManager::loadAllLanguageProfiles() +{ + LanguageProfileMap* lp = new LanguageProfileMap(); + + // clear the language profile + lp->clear(); + + // find the Kat application data path + QStringList m_languageFiles = KGlobal::dirs()->findAllResources( "data", "kat/language/*.klp", false, true ); + + //delete files have .klpd extension + QStringList deletedLanguageList = KGlobal::dirs()->findAllResources( "data", "kat/language/*.klpd", false, true ); + QStringList deletedFileLanguage; + QStringList::Iterator end( deletedLanguageList.end() ); + for ( QStringList::Iterator it = deletedLanguageList.begin(); it != end; ++it ) + { + KURL file( *it ); + QString tmp = file.filename().mid( 0, file.filename().length() - 5 ); + kdDebug() << "loadAllLanguageProfiles tmp :" << tmp << endl; + deletedFileLanguage.append( tmp ); + } + // load the language profiles + QStringList::Iterator endLang( m_languageFiles.end() ); + for ( QStringList::Iterator it = m_languageFiles.begin(); it != endLang; ++it ) + { + QString lname = (*it).mid( 0, (*it).length()-4 ); + KURL tmpFile( *it ); + QString tmp = tmpFile.filename().mid( 0, tmpFile.filename().length() - 4 ); + //it was removed => don't load it + if ( deletedFileLanguage.contains( tmp ) ) + continue; + + QString profilePath = *it ; + QDomDocument doc( profilePath ); + + QFile file( profilePath ); + if ( !file.exists() ) + return lp; + + if ( !file.open( IO_ReadOnly ) ) + { + kdDebug() << "Impossible to open " << profilePath << endl; + return lp; + } + QByteArray m_data = file.readAll(); + + QString qs; + if ( !doc.setContent( QString( m_data ).utf8(), &qs ) ) + { + kdDebug() << "Impossible to set content from " << profilePath << " ERROR: " << qs << endl; + file.close(); + return lp; + } + file.close(); + + // create the list of ngrams of the language profile + LanguageProfile lprofile; + lprofile.clear(); + QDomElement docElem = doc.documentElement(); + QDomNode n = docElem.firstChild(); + long index = 0L; + + while( !n.isNull() ) + { + QDomElement e = n.toElement(); + if( !e.isNull() ) + lprofile.insert( QString( e.attribute( "value" ) ), index ); + + index++; + n = n.nextSibling(); + } + + QString tmpLang = tmpFile.filename().mid( 0, tmpFile.filename().length() - 4 ); + //kdDebug() << " language insert :" << tmpLang << endl; + lp->insert( tmpLang , lprofile ); + } + + return lp; +} + diff --git a/src/plugins/language/korean.klp b/src/plugins/language/korean.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1074" value="_" /> + <ngram occurrences="347" value="¸" /> + <ngram occurrences="302" value="à" /> + <ngram occurrences="225" value="ç" /> + <ngram occurrences="129" value="µ" /> + <ngram occurrences="129" value="_à" /> + <ngram occurrences="127" value="½" /> + <ngram occurrences="108" value="_¸" /> + <ngram occurrences="107" value="á" /> + <ngram occurrences="93" value="ã" /> + <ngram occurrences="90" value="º" /> + <ngram occurrences="89" value="ù" /> + <ngram occurrences="85" value="_ç" /> + <ngram occurrences="83" value="â" /> + <ngram occurrences="82" value="î" /> + <ngram occurrences="78" value="¸_" /> + <ngram occurrences="78" value="ö" /> + <ngram occurrences="78" value="ì" /> + <ngram occurrences="74" value="³" /> + <ngram occurrences="73" value="ÿ" /> + <ngram occurrences="71" value="¹" /> + <ngram occurrences="68" value="ø" /> + <ngram occurrences="67" value="æ" /> + <ngram occurrences="66" value="¸ù" /> + <ngram occurrences="66" value="ù_" /> + <ngram occurrences="65" value="ç_" /> + <ngram occurrences="65" value="àì" /> + <ngram occurrences="64" value="è" /> + <ngram occurrences="63" value="_½" /> + <ngram occurrences="62" value="í" /> + <ngram occurrences="62" value="_á" /> + <ngram occurrences="59" value="ï" /> + <ngram occurrences="58" value="å" /> + <ngram occurrences="56" value="ë" /> + <ngram occurrences="53" value="¸ù_" /> + <ngram occurrences="50" value="_³" /> + <ngram occurrences="49" value="â_" /> + <ngram occurrences="48" value="ì_" /> + <ngram occurrences="48" value="é" /> + <ngram occurrences="48" value="_í" /> + <ngram occurrences="48" value="_ã" /> + <ngram occurrences="46" value="à_" /> + <ngram occurrences="44" value="½_" /> + <ngram occurrences="44" value="í_" /> + <ngram occurrences="44" value="_µ" /> + <ngram occurrences="42" value="ú" /> + <ngram occurrences="41" value="_¹" /> + <ngram occurrences="40" value="ñ" /> + <ngram occurrences="40" value="î_" /> + <ngram occurrences="40" value="àì_" /> + <ngram occurrences="40" value="àç" /> + <ngram occurrences="37" value="µ_" /> + <ngram occurrences="37" value="_í_" /> + <ngram occurrences="36" value="¨" /> + <ngram occurrences="36" value="áö" /> + <ngram occurrences="36" value="_ÿ" /> + <ngram occurrences="36" value="_ø" /> + <ngram occurrences="35" value="ä" /> + <ngram occurrences="35" value="_â" /> + <ngram occurrences="34" value="ß" /> + <ngram occurrences="34" value="_àì" /> + <ngram occurrences="33" value="ü" /> + <ngram occurrences="33" value="ó" /> + <ngram occurrences="33" value="_º" /> + <ngram occurrences="32" value="ø_" /> + <ngram occurrences="32" value="º_" /> + <ngram occurrences="31" value="ï_" /> + <ngram occurrences="30" value="¸â" /> + <ngram occurrences="29" value="àç_" /> + <ngram occurrences="28" value="¸â_" /> + <ngram occurrences="28" value="æ_" /> + <ngram occurrences="28" value="á_" /> + <ngram occurrences="28" value="µé" /> + <ngram occurrences="27" value="¨_" /> + <ngram occurrences="27" value="ñ_" /> + <ngram occurrences="27" value="ã_" /> + <ngram occurrences="27" value="³_" /> + <ngram occurrences="26" value="è_" /> + <ngram occurrences="26" value="_½_" /> + <ngram occurrences="25" value="ö_" /> + <ngram occurrences="25" value="çñ" /> + <ngram occurrences="25" value="_¸_" /> + <ngram occurrences="25" value="_è" /> + <ngram occurrences="25" value="_áö" /> + <ngram occurrences="24" value="¸¸" /> + <ngram occurrences="24" value="¸ç" /> + <ngram occurrences="24" value="_î" /> + <ngram occurrences="23" value="ý" /> + <ngram occurrences="23" value="ú_" /> + <ngram occurrences="23" value="ô" /> + <ngram occurrences="23" value="ð" /> + <ngram occurrences="23" value="àº" /> + <ngram occurrences="23" value="_æ" /> + <ngram occurrences="22" value="¸¨_" /> + <ngram occurrences="22" value="¸¨" /> + <ngram occurrences="22" value="àö" /> + <ngram occurrences="22" value="²" /> + <ngram occurrences="21" value="¸ë" /> + <ngram occurrences="21" value="û" /> + <ngram occurrences="21" value="ò" /> + <ngram occurrences="21" value="ê" /> + <ngram occurrences="21" value="é_" /> + <ngram occurrences="21" value="àº_" /> + <ngram occurrences="21" value="_ë" /> + <ngram occurrences="21" value="_àö" /> + <ngram occurrences="20" value="ö¸" /> + <ngram occurrences="20" value="çñ_" /> + <ngram occurrences="19" value="ä_" /> + <ngram occurrences="19" value="_î_" /> + <ngram occurrences="18" value="ë_" /> + <ngram occurrences="18" value="çï" /> + <ngram occurrences="18" value="à¸" /> + <ngram occurrences="18" value="ª" /> + <ngram occurrences="18" value="_ó" /> + <ngram occurrences="18" value="_å" /> + <ngram occurrences="17" value="éà" /> + <ngram occurrences="17" value="àú" /> + <ngram occurrences="17" value="àö¸" /> + <ngram occurrences="17" value="¹_" /> + <ngram occurrences="17" value="_³_" /> + <ngram occurrences="16" value="½ã" /> + <ngram occurrences="16" value="è¸" /> + <ngram occurrences="16" value="_ù" /> + <ngram occurrences="16" value="_àö¸" /> + <ngram occurrences="16" value="_àì_" /> + <ngram occurrences="15" value="ü_" /> + <ngram occurrences="15" value="áö_" /> + <ngram occurrences="15" value="_ú" /> + <ngram occurrences="15" value="_æ_" /> + <ngram occurrences="15" value="_á_" /> + <ngram occurrences="14" value="½º" /> + <ngram occurrences="14" value="ÿî" /> + <ngram occurrences="14" value="øà" /> + <ngram occurrences="14" value="ð_" /> + <ngram occurrences="14" value="àü" /> + <ngram occurrences="14" value="àï" /> + <ngram occurrences="14" value="ºî" /> + <ngram occurrences="14" value="µî" /> + <ngram occurrences="14" value="µéà" /> + <ngram occurrences="14" value="µµ" /> + <ngram occurrences="14" value="_ý" /> + <ngram occurrences="14" value="_ç_" /> + <ngram occurrences="14" value="_â_" /> + <ngram occurrences="14" value="_àç" /> + <ngram occurrences="13" value="¸ï" /> + <ngram occurrences="13" value="¸ç_" /> + <ngram occurrences="13" value="ÿæ" /> + <ngram occurrences="13" value="ù_à" /> + <ngram occurrences="13" value="ö¸ù" /> + <ngram occurrences="13" value="î¸" /> + <ngram occurrences="13" value="çà" /> + <ngram occurrences="13" value="å_" /> + <ngram occurrences="13" value="àö¸ù" /> + <ngram occurrences="13" value="߸" /> + <ngram occurrences="13" value="µé_" /> + <ngram occurrences="13" value="³ª" /> + <ngram occurrences="13" value="_ø_" /> + <ngram occurrences="13" value="_ô" /> + <ngram occurrences="12" value="ö¸ù_" /> + <ngram occurrences="12" value="ó_" /> + <ngram occurrences="12" value="í_à" /> + <ngram occurrences="12" value="ç߸ù_" /> + <ngram occurrences="12" value="ç߸ù" /> + <ngram occurrences="12" value="ç߸" /> + <ngram occurrences="12" value="çß" /> + <ngram occurrences="12" value="ç_à" /> + <ngram occurrences="12" value="àö¸ù_" /> + <ngram occurrences="12" value="߸ù_" /> + <ngram occurrences="12" value="߸ù" /> + <ngram occurrences="12" value="ß_" /> + <ngram occurrences="12" value="µµ_" /> + <ngram occurrences="12" value="_¸¸" /> + <ngram occurrences="12" value="_¸ù" /> + <ngram occurrences="12" value="_ù_" /> + <ngram occurrences="12" value="_àö¸ù" /> + <ngram occurrences="12" value="_¹_" /> + <ngram occurrences="12" value="_µî" /> + <ngram occurrences="11" value="õ" /> + <ngram occurrences="11" value="íà" /> + <ngram occurrences="11" value="ì¸" /> + <ngram occurrences="11" value="çï_" /> + <ngram occurrences="11" value="à¸_" /> + <ngram occurrences="11" value="àû" /> + <ngram occurrences="11" value="àú_" /> + <ngram occurrences="11" value="_¸ë" /> + <ngram occurrences="11" value="_øà" /> + <ngram occurrences="11" value="_í_à" /> + <ngram occurrences="11" value="_àï" /> + <ngram occurrences="11" value="_à_" /> + <ngram occurrences="10" value="¸ù_à" /> + <ngram occurrences="10" value="¸_î" /> + <ngram occurrences="10" value="ÿè" /> + <ngram occurrences="10" value="ý_" /> + <ngram occurrences="10" value="ê_" /> + <ngram occurrences="10" value="è¸_" /> + <ngram occurrences="10" value="ç¸" /> + <ngram occurrences="10" value="åë" /> + <ngram occurrences="10" value="ãµ" /> + <ngram occurrences="10" value="à¸_î" /> + <ngram occurrences="10" value="àì¸" /> + <ngram occurrences="10" value="º¸" /> + <ngram occurrences="10" value="ª_" /> + <ngram occurrences="10" value="_¸ç" /> + <ngram occurrences="10" value="_ï" /> + <ngram occurrences="10" value="_ê" /> + <ngram occurrences="10" value="_ã_" /> + <ngram occurrences="9" value="¸ù_í_" /> + <ngram occurrences="9" value="¸ù_í" /> + <ngram occurrences="9" value="¸_î_" /> + <ngram occurrences="9" value="¸_ç" /> + <ngram occurrences="9" value="¸_à" /> + <ngram occurrences="9" value="û_" /> + <ngram occurrences="9" value="ú¸" /> + <ngram occurrences="9" value="ù¸" /> + <ngram occurrences="9" value="ù_í_" /> + <ngram occurrences="9" value="ù_í" /> + <ngram occurrences="9" value="ô_" /> + <ngram occurrences="9" value="ó¸" /> + <ngram occurrences="9" value="ò_" /> + <ngram occurrences="9" value="í_àö¸" /> + <ngram occurrences="9" value="í_àö" /> + <ngram occurrences="9" value="çø" /> + <ngram occurrences="9" value="ç_½" /> + <ngram occurrences="9" value="â_á" /> + <ngram occurrences="9" value="á¨" /> + <ngram occurrences="9" value="áß" /> + <ngram occurrences="9" value="à¸_î_" /> + <ngram occurrences="9" value="àï_" /> + <ngram occurrences="9" value="àî" /> + <ngram occurrences="9" value="_¸¨_" /> + <ngram occurrences="9" value="_¸¨" /> + <ngram occurrences="9" value="_ô_" /> + <ngram occurrences="9" value="_ó_" /> + <ngram occurrences="9" value="_í_àö" /> + <ngram occurrences="9" value="_è_" /> + <ngram occurrences="9" value="_àç_" /> + <ngram occurrences="8" value="¸¸_" /> + <ngram occurrences="8" value="¸é" /> + <ngram occurrences="8" value="¸_ø" /> + <ngram occurrences="8" value="½ö" /> + <ngram occurrences="8" value="½_¸" /> + <ngram occurrences="8" value="ÿî¸" /> + <ngram occurrences="8" value="ÿç" /> + <ngram occurrences="8" value="ï¸" /> + <ngram occurrences="8" value="çô" /> + <ngram occurrences="8" value="çð_" /> + <ngram occurrences="8" value="çð" /> + <ngram occurrences="8" value="æ_â" /> + <ngram occurrences="8" value="â_à" /> + <ngram occurrences="8" value="áø" /> + <ngram occurrences="8" value="ºî_" /> + <ngram occurrences="8" value="¹à" /> + <ngram occurrences="8" value="²_" /> + <ngram occurrences="8" value="_ÿè" /> + <ngram occurrences="8" value="_ü" /> + <ngram occurrences="8" value="_ú_" /> + <ngram occurrences="8" value="_áö_" /> + <ngram occurrences="8" value="_àú" /> + <ngram occurrences="8" value="_àï_" /> + <ngram occurrences="8" value="_µ_" /> + <ngram occurrences="8" value="_³ª" /> + <ngram occurrences="7" value="¸ù¸" /> + <ngram occurrences="7" value="¸ù_àì" /> + <ngram occurrences="7" value="¸ó¸ï" /> + <ngram occurrences="7" value="¸ó¸" /> + <ngram occurrences="7" value="¸ó" /> + <ngram occurrences="7" value="¸í" /> + <ngram occurrences="7" value="¸â_á" /> + <ngram occurrences="7" value="½ò" /> + <ngram occurrences="7" value="½_à" /> + <ngram occurrences="7" value="ÿî¸ó¸" /> + <ngram occurrences="7" value="ÿî¸ó" /> + <ngram occurrences="7" value="þ" /> + <ngram occurrences="7" value="ýà" /> + <ngram occurrences="7" value="ù_àì" /> + <ngram occurrences="7" value="öÿ" /> + <ngram occurrences="7" value="ó¸ï" /> + <ngram occurrences="7" value="î¸ó¸ï" /> + <ngram occurrences="7" value="î¸ó¸" /> + <ngram occurrences="7" value="î¸ó" /> + <ngram occurrences="7" value="îà" /> + <ngram occurrences="7" value="éàì_" /> + <ngram occurrences="7" value="éàì" /> + <ngram occurrences="7" value="çè" /> + <ngram occurrences="7" value="çã" /> + <ngram occurrences="7" value="ç_½_" /> + <ngram occurrences="7" value="ç_àì" /> + <ngram occurrences="7" value="ç_³" /> + <ngram occurrences="7" value="æà" /> + <ngram occurrences="7" value="ã½" /> + <ngram occurrences="7" value="ãñ" /> + <ngram occurrences="7" value="ãµ_" /> + <ngram occurrences="7" value="âà" /> + <ngram occurrences="7" value="âµ" /> + <ngram occurrences="7" value="àü_" /> + <ngram occurrences="7" value="àå" /> + <ngram occurrences="7" value="¹ß" /> + <ngram occurrences="7" value="µî_" /> + <ngram occurrences="7" value="µéàì_" /> + <ngram occurrences="7" value="µéàì" /> + <ngram occurrences="7" value="³â" /> + <ngram occurrences="7" value="_ÿæ" /> + <ngram occurrences="7" value="_ï_" /> + <ngram occurrences="7" value="_íà" /> + <ngram occurrences="7" value="_ë_" /> + <ngram occurrences="7" value="_ê_" /> + <ngram occurrences="7" value="_è¸" /> + <ngram occurrences="7" value="_çø" /> + <ngram occurrences="7" value="_çï" /> + <ngram occurrences="7" value="_ç߸ù" /> + <ngram occurrences="7" value="_ç߸" /> + <ngram occurrences="7" value="_çß" /> + <ngram occurrences="7" value="_æ_â" /> + <ngram occurrences="7" value="_ä" /> + <ngram occurrences="7" value="_ãñ" /> + <ngram occurrences="7" value="_àü" /> + <ngram occurrences="7" value="_àì¸" /> + <ngram occurrences="7" value="_³â" /> + <ngram occurrences="6" value="¸ü" /> + <ngram occurrences="6" value="¸ø" /> + <ngram occurrences="6" value="¸µ" /> + <ngram occurrences="6" value="¸_¸" /> + <ngram occurrences="6" value="¸_ã" /> + <ngram occurrences="6" value="½ö_" /> + <ngram occurrences="6" value="½å" /> + <ngram occurrences="6" value="½ã_" /> + <ngram occurrences="6" value="ÿ_" /> + <ngram occurrences="6" value="øµ" /> + <ngram occurrences="6" value="õ_" /> + <ngram occurrences="6" value="ô²²_" /> + <ngram occurrences="6" value="ô²²" /> + <ngram occurrences="6" value="ô²" /> + <ngram occurrences="6" value="ìµ" /> + <ngram occurrences="6" value="ì_á" /> + <ngram occurrences="6" value="ëç" /> + <ngram occurrences="6" value="ëá" /> + <ngram occurrences="6" value="é¸" /> + <ngram occurrences="6" value="çô²²_" /> + <ngram occurrences="6" value="çô²²" /> + <ngram occurrences="6" value="çô²" /> + <ngram occurrences="6" value="çç" /> + <ngram occurrences="6" value="æä" /> + <ngram occurrences="6" value="å¸" /> + <ngram occurrences="6" value="ä_¸" /> + <ngram occurrences="6" value="ãç" /> + <ngram occurrences="6" value="ãà" /> + <ngram occurrences="6" value="áß_" /> + <ngram occurrences="6" value="á_à" /> + <ngram occurrences="6" value="àì_á" /> + <ngram occurrences="6" value="º¸_" /> + <ngram occurrences="6" value="º_¸" /> + <ngram occurrences="6" value="¹î" /> + <ngram occurrences="6" value="¹é" /> + <ngram occurrences="6" value="µîà" /> + <ngram occurrences="6" value="µç" /> + <ngram occurrences="6" value="³ª_" /> + <ngram occurrences="6" value="²²_" /> + <ngram occurrences="6" value="²²" /> + <ngram occurrences="6" value="_¸ç_" /> + <ngram occurrences="6" value="_½ö" /> + <ngram occurrences="6" value="_½å" /> + <ngram occurrences="6" value="_½ã" /> + <ngram occurrences="6" value="_ÿî¸" /> + <ngram occurrences="6" value="_ÿî" /> + <ngram occurrences="6" value="_çô" /> + <ngram occurrences="6" value="_ãµ" /> + <ngram occurrences="6" value="_âà" /> + <ngram occurrences="6" value="_àº" /> + <ngram occurrences="6" value="_º_" /> + <ngram occurrences="6" value="_¹é" /> + <ngram occurrences="6" value="_µîà" /> + <ngram occurrences="6" value="_µî_" /> + <ngram occurrences="6" value="_µé" /> + <ngram occurrences="5" value="¸¸µ" /> + <ngram occurrences="5" value="¸ù_¸" /> + <ngram occurrences="5" value="¸ø_" /> + <ngram occurrences="5" value="¸ë_" /> + <ngram occurrences="5" value="¸â_áö" /> + <ngram occurrences="5" value="¸_½" /> + <ngram occurrences="5" value="¸_ç߸" /> + <ngram occurrences="5" value="¸_çß" /> + <ngram occurrences="5" value="¨_ã" /> + <ngram occurrences="5" value="½½" /> + <ngram occurrences="5" value="½ºä" /> + <ngram occurrences="5" value="½º_" /> + <ngram occurrences="5" value="½_ç" /> + <ngram occurrences="5" value="üç" /> + <ngram occurrences="5" value="ü_ë" /> + <ngram occurrences="5" value="ûà" /> + <ngram occurrences="5" value="ú¸ù" /> + <ngram occurrences="5" value="ù_¸" /> + <ngram occurrences="5" value="ù_½" /> + <ngram occurrences="5" value="ù_àì_" /> + <ngram occurrences="5" value="øç" /> + <ngram occurrences="5" value="öà" /> + <ngram occurrences="5" value="ö³_" /> + <ngram occurrences="5" value="ö³" /> + <ngram occurrences="5" value="ö_¸" /> + <ngram occurrences="5" value="ñ_¹" /> + <ngram occurrences="5" value="ïµ" /> +</ngrams> diff --git a/src/plugins/language/latin.klp b/src/plugins/language/latin.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="723" value="_" /> + <ngram occurrences="473" value="e" /> + <ngram occurrences="437" value="i" /> + <ngram occurrences="363" value="a" /> + <ngram occurrences="344" value="u" /> + <ngram occurrences="332" value="t" /> + <ngram occurrences="312" value="s" /> + <ngram occurrences="279" value="r" /> + <ngram occurrences="240" value="m" /> + <ngram occurrences="229" value="o" /> + <ngram occurrences="228" value="n" /> + <ngram occurrences="161" value="s_" /> + <ngram occurrences="154" value="c" /> + <ngram occurrences="143" value="l" /> + <ngram occurrences="124" value="e_" /> + <ngram occurrences="120" value="p" /> + <ngram occurrences="106" value="d" /> + <ngram occurrences="100" value="t_" /> + <ngram occurrences="99" value="m_" /> + <ngram occurrences="86" value="qu" /> + <ngram occurrences="86" value="q" /> + <ngram occurrences="79" value="er" /> + <ngram occurrences="71" value="is" /> + <ngram occurrences="71" value="a_" /> + <ngram occurrences="71" value="_i" /> + <ngram occurrences="70" value="_a" /> + <ngram occurrences="68" value="v" /> + <ngram occurrences="67" value="um" /> + <ngram occurrences="63" value="re" /> + <ngram occurrences="61" value="te" /> + <ngram occurrences="59" value="_s" /> + <ngram occurrences="56" value="it" /> + <ngram occurrences="56" value="is_" /> + <ngram occurrences="55" value="ue" /> + <ngram occurrences="55" value="in" /> + <ngram occurrences="55" value="_p" /> + <ngram occurrences="55" value="_e" /> + <ngram occurrences="54" value="us" /> + <ngram occurrences="52" value="b" /> + <ngram occurrences="51" value="i_" /> + <ngram occurrences="51" value="_c" /> + <ngram occurrences="49" value="que" /> + <ngram occurrences="48" value="um_" /> + <ngram occurrences="48" value="nt" /> + <ngram occurrences="48" value="at" /> + <ngram occurrences="47" value="ra" /> + <ngram occurrences="45" value="us_" /> + <ngram occurrences="45" value="ue_" /> + <ngram occurrences="45" value="que_" /> + <ngram occurrences="45" value="_t" /> + <ngram occurrences="44" value="or" /> + <ngram occurrences="44" value="en" /> + <ngram occurrences="43" value="ti" /> + <ngram occurrences="43" value="h" /> + <ngram occurrences="42" value="g" /> + <ngram occurrences="42" value="f" /> + <ngram occurrences="41" value="et" /> + <ngram occurrences="40" value="li" /> + <ngram occurrences="40" value="am" /> + <ngram occurrences="40" value="_m" /> + <ngram occurrences="39" value="tu" /> + <ngram occurrences="39" value="_d" /> + <ngram occurrences="38" value="ro" /> + <ngram occurrences="38" value="em" /> + <ngram occurrences="37" value="o_" /> + <ngram occurrences="34" value="et_" /> + <ngram occurrences="33" value="os" /> + <ngram occurrences="33" value="an" /> + <ngram occurrences="33" value="_v" /> + <ngram occurrences="33" value="_f" /> + <ngram occurrences="32" value="ta" /> + <ngram occurrences="31" value="ia" /> + <ngram occurrences="30" value="ur" /> + <ngram occurrences="30" value="r_" /> + <ngram occurrences="30" value="de" /> + <ngram occurrences="30" value="ae" /> + <ngram occurrences="29" value="ri" /> + <ngram occurrences="29" value="pe" /> + <ngram occurrences="29" value="on" /> + <ngram occurrences="29" value="mi" /> + <ngram occurrences="29" value="_h" /> + <ngram occurrences="29" value="_et_" /> + <ngram occurrences="29" value="_et" /> + <ngram occurrences="28" value="ui" /> + <ngram occurrences="28" value="si" /> + <ngram occurrences="27" value="ni" /> + <ngram occurrences="27" value="la" /> + <ngram occurrences="27" value="es" /> + <ngram occurrences="27" value="_n" /> + <ngram occurrences="26" value="s_a" /> + <ngram occurrences="26" value="na" /> + <ngram occurrences="26" value="im" /> + <ngram occurrences="26" value="ic" /> + <ngram occurrences="26" value="am_" /> + <ngram occurrences="26" value="_in" /> + <ngram occurrences="25" value="ma" /> + <ngram occurrences="25" value="_qu" /> + <ngram occurrences="25" value="_q" /> + <ngram occurrences="24" value="vi" /> + <ngram occurrences="24" value="st" /> + <ngram occurrences="24" value="re_" /> + <ngram occurrences="24" value="em_" /> + <ngram occurrences="24" value="_r" /> + <ngram occurrences="24" value="_l" /> + <ngram occurrences="23" value="di" /> + <ngram occurrences="22" value="ve" /> + <ngram occurrences="22" value="tr" /> + <ngram occurrences="22" value="ns" /> + <ngram occurrences="22" value="id" /> + <ngram occurrences="21" value="ul" /> + <ngram occurrences="21" value="to" /> + <ngram occurrences="21" value="su" /> + <ngram occurrences="21" value="ne" /> + <ngram occurrences="21" value="it_" /> + <ngram occurrences="21" value="cu" /> + <ngram occurrences="21" value="ci" /> + <ngram occurrences="21" value="as" /> + <ngram occurrences="20" value="un" /> + <ngram occurrences="20" value="os_" /> + <ngram occurrences="20" value="hi" /> + <ngram occurrences="20" value="el" /> + <ngram occurrences="20" value="ct" /> + <ngram occurrences="20" value="co" /> + <ngram occurrences="20" value="c_" /> + <ngram occurrences="19" value="te_" /> + <ngram occurrences="19" value="s_i" /> + <ngram occurrences="19" value="s_e" /> + <ngram occurrences="19" value="ru" /> + <ngram occurrences="19" value="pr" /> + <ngram occurrences="19" value="mu" /> + <ngram occurrences="19" value="ere" /> + <ngram occurrences="19" value="_te" /> + <ngram occurrences="18" value="se" /> + <ngram occurrences="18" value="qui" /> + <ngram occurrences="18" value="ol" /> + <ngram occurrences="18" value="no" /> + <ngram occurrences="18" value="le" /> + <ngram occurrences="18" value="il" /> + <ngram occurrences="18" value="ec" /> + <ngram occurrences="18" value="au" /> + <ngram occurrences="18" value="ar" /> + <ngram occurrences="18" value="_o" /> + <ngram occurrences="17" value="sa" /> + <ngram occurrences="17" value="nt_" /> + <ngram occurrences="17" value="m_i" /> + <ngram occurrences="17" value="at_" /> + <ngram occurrences="16" value="ter" /> + <ngram occurrences="16" value="n_" /> + <ngram occurrences="16" value="ll" /> + <ngram occurrences="16" value="ent" /> + <ngram occurrences="16" value="e_p" /> + <ngram occurrences="16" value="do" /> + <ngram occurrences="16" value="_pr" /> + <ngram occurrences="15" value="rt" /> + <ngram occurrences="15" value="pi" /> + <ngram occurrences="15" value="nu" /> + <ngram occurrences="15" value="ere_" /> + <ngram occurrences="15" value="er_" /> + <ngram occurrences="15" value="e_s" /> + <ngram occurrences="15" value="ca" /> + <ngram occurrences="15" value="as_" /> + <ngram occurrences="15" value="al" /> + <ngram occurrences="15" value="ac" /> + <ngram occurrences="15" value="_si" /> + <ngram occurrences="15" value="_re" /> + <ngram occurrences="15" value="_pe" /> + <ngram occurrences="14" value="sque_" /> + <ngram occurrences="14" value="sque" /> + <ngram occurrences="14" value="squ" /> + <ngram occurrences="14" value="sq" /> + <ngram occurrences="14" value="per" /> + <ngram occurrences="14" value="om" /> + <ngram occurrences="14" value="mo" /> + <ngram occurrences="14" value="me" /> + <ngram occurrences="14" value="iu" /> + <ngram occurrences="14" value="ib" /> + <ngram occurrences="14" value="es_" /> + <ngram occurrences="14" value="ce" /> + <ngram occurrences="14" value="ant" /> + <ngram occurrences="14" value="_u" /> + <ngram occurrences="14" value="_su" /> + <ngram occurrences="14" value="_co" /> + <ngram occurrences="14" value="_au" /> + <ngram occurrences="13" value="x" /> + <ngram occurrences="13" value="tis" /> + <ngram occurrences="13" value="ra_" /> + <ngram occurrences="13" value="pro" /> + <ngram occurrences="13" value="pa" /> + <ngram occurrences="13" value="na_" /> + <ngram occurrences="13" value="lu" /> + <ngram occurrences="13" value="is_a" /> + <ngram occurrences="13" value="e_t" /> + <ngram occurrences="13" value="da" /> + <ngram occurrences="13" value="_vi" /> + <ngram occurrences="13" value="_no" /> + <ngram occurrences="13" value="_ma" /> + <ngram occurrences="13" value="_hi" /> + <ngram occurrences="13" value="_de" /> + <ngram occurrences="12" value="vo" /> + <ngram occurrences="12" value="unt" /> + <ngram occurrences="12" value="uis" /> + <ngram occurrences="12" value="tis_" /> + <ngram occurrences="12" value="ti_" /> + <ngram occurrences="12" value="tem" /> + <ngram occurrences="12" value="ss" /> + <ngram occurrences="12" value="s_et_" /> + <ngram occurrences="12" value="s_et" /> + <ngram occurrences="12" value="pu" /> + <ngram occurrences="12" value="po" /> + <ngram occurrences="12" value="nd" /> + <ngram occurrences="12" value="lo" /> + <ngram occurrences="12" value="ir" /> + <ngram occurrences="12" value="iam" /> + <ngram occurrences="12" value="ia_" /> + <ngram occurrences="12" value="fe" /> + <ngram occurrences="12" value="era" /> + <ngram occurrences="12" value="ens" /> + <ngram occurrences="12" value="_ve" /> + <ngram occurrences="12" value="_sa" /> + <ngram occurrences="12" value="_pro" /> + <ngram occurrences="12" value="_pa" /> + <ngram occurrences="12" value="_la" /> + <ngram occurrences="11" value="us_a" /> + <ngram occurrences="11" value="up" /> + <ngram occurrences="11" value="uo" /> + <ngram occurrences="11" value="ta_" /> + <ngram occurrences="11" value="s_s" /> + <ngram occurrences="11" value="s_p" /> + <ngram occurrences="11" value="s_in" /> + <ngram occurrences="11" value="rum_" /> + <ngram occurrences="11" value="rum" /> + <ngram occurrences="11" value="quo" /> + <ngram occurrences="11" value="nti" /> + <ngram occurrences="11" value="nte" /> + <ngram occurrences="11" value="mp" /> + <ngram occurrences="11" value="equ" /> + <ngram occurrences="11" value="eq" /> + <ngram occurrences="11" value="cum" /> + <ngram occurrences="11" value="bi" /> + <ngram occurrences="11" value="ag" /> + <ngram occurrences="11" value="a_c" /> + <ngram occurrences="11" value="_im" /> + <ngram occurrences="11" value="_cu" /> + <ngram occurrences="11" value="_ca" /> + <ngram occurrences="10" value="ut" /> + <ngram occurrences="10" value="tum" /> + <ngram occurrences="10" value="tor" /> + <ngram occurrences="10" value="tem_" /> + <ngram occurrences="10" value="t_i" /> + <ngram occurrences="10" value="rr" /> + <ngram occurrences="10" value="ros" /> + <ngram occurrences="10" value="rat" /> + <ngram occurrences="10" value="ora" /> + <ngram occurrences="10" value="ns_" /> + <ngram occurrences="10" value="nis" /> + <ngram occurrences="10" value="nc" /> + <ngram occurrences="10" value="ic_" /> + <ngram occurrences="10" value="ibu" /> + <ngram occurrences="10" value="gn" /> + <ngram occurrences="10" value="gi" /> + <ngram occurrences="10" value="ex" /> + <ngram occurrences="10" value="ect" /> + <ngram occurrences="10" value="e_r" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="bu" /> + <ngram occurrences="10" value="ba" /> + <ngram occurrences="10" value="av" /> + <ngram occurrences="10" value="_tr" /> + <ngram occurrences="10" value="_quo" /> + <ngram occurrences="10" value="_il" /> + <ngram occurrences="10" value="_fe" /> + <ngram occurrences="10" value="_ac" /> + <ngram occurrences="9" value="ver" /> + <ngram occurrences="9" value="unt_" /> + <ngram occurrences="9" value="tur" /> + <ngram occurrences="9" value="tum_" /> + <ngram occurrences="9" value="t_e" /> + <ngram occurrences="9" value="si_" /> + <ngram occurrences="9" value="s_m" /> + <ngram occurrences="9" value="op" /> + <ngram occurrences="9" value="oc" /> + <ngram occurrences="9" value="itu" /> + <ngram occurrences="9" value="ie" /> + <ngram occurrences="9" value="ibus" /> + <ngram occurrences="9" value="iam_" /> + <ngram occurrences="9" value="fer" /> + <ngram occurrences="9" value="ev" /> + <ngram occurrences="9" value="eri" /> + <ngram occurrences="9" value="ep" /> + <ngram occurrences="9" value="eli" /> + <ngram occurrences="9" value="e_a" /> + <ngram occurrences="9" value="bus" /> + <ngram occurrences="9" value="ate" /> + <ngram occurrences="9" value="ad" /> + <ngram occurrences="9" value="_se" /> + <ngram occurrences="9" value="_po" /> + <ngram occurrences="9" value="_fer" /> + <ngram occurrences="9" value="_do" /> + <ngram occurrences="9" value="_da" /> + <ngram occurrences="9" value="_ae" /> + <ngram occurrences="8" value="uis_" /> + <ngram occurrences="8" value="uc" /> + <ngram occurrences="8" value="ua" /> + <ngram occurrences="8" value="tus" /> + <ngram occurrences="8" value="tro" /> + <ngram occurrences="8" value="ter_" /> + <ngram occurrences="8" value="t_s" /> + <ngram occurrences="8" value="t_a" /> + <ngram occurrences="8" value="s_t" /> + <ngram occurrences="8" value="s_qu" /> + <ngram occurrences="8" value="s_q" /> + <ngram occurrences="8" value="s_c" /> + <ngram occurrences="8" value="ro_" /> + <ngram occurrences="8" value="rem" /> + <ngram occurrences="8" value="rat_" /> + <ngram occurrences="8" value="ora_" /> + <ngram occurrences="8" value="ntem" /> + <ngram occurrences="8" value="non" /> + <ngram occurrences="8" value="nis_" /> + <ngram occurrences="8" value="ng" /> + <ngram occurrences="8" value="mqu" /> + <ngram occurrences="8" value="mq" /> + <ngram occurrences="8" value="min" /> + <ngram occurrences="8" value="m_s" /> + <ngram occurrences="8" value="m_c" /> + <ngram occurrences="8" value="lia" /> + <ngram occurrences="8" value="ite" /> + <ngram occurrences="8" value="ip" /> + <ngram occurrences="8" value="imp" /> + <ngram occurrences="8" value="ill" /> + <ngram occurrences="8" value="ig" /> + <ngram occurrences="8" value="ibus_" /> + <ngram occurrences="8" value="hic_" /> + <ngram occurrences="8" value="hic" /> + <ngram occurrences="8" value="fu" /> + <ngram occurrences="8" value="eu" /> + <ngram occurrences="8" value="ens_" /> + <ngram occurrences="8" value="ed" /> + <ngram occurrences="8" value="eb" /> + <ngram occurrences="8" value="e_v" /> + <ngram occurrences="8" value="d_" /> + <ngram occurrences="8" value="cum_" /> + <ngram occurrences="8" value="cto" /> + <ngram occurrences="8" value="cr" /> + <ngram occurrences="8" value="bus_" /> + <ngram occurrences="8" value="be" /> + <ngram occurrences="8" value="ap" /> + <ngram occurrences="8" value="ab" /> + <ngram occurrences="8" value="_mo" /> + <ngram occurrences="8" value="_me" /> + <ngram occurrences="8" value="_imp" /> + <ngram occurrences="8" value="_hic_" /> + <ngram occurrences="8" value="_hic" /> + <ngram occurrences="7" value="us_e" /> + <ngram occurrences="7" value="ur_" /> + <ngram occurrences="7" value="um_i" /> + <ngram occurrences="7" value="uit" /> + <ngram occurrences="7" value="ue_p" /> + <ngram occurrences="7" value="ue_a" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="tque_" /> + <ngram occurrences="7" value="tque" /> + <ngram occurrences="7" value="tqu" /> + <ngram occurrences="7" value="tq" /> + <ngram occurrences="7" value="t_f" /> + <ngram occurrences="7" value="t_c" /> + <ngram occurrences="7" value="se_" /> + <ngram occurrences="7" value="sc" /> + <ngram occurrences="7" value="s_h" /> + <ngram occurrences="7" value="ros_" /> + <ngram occurrences="7" value="ris" /> + <ngram occurrences="7" value="quis_" /> + <ngram occurrences="7" value="quis" /> + <ngram occurrences="7" value="que_p" /> + <ngram occurrences="7" value="que_a" /> + <ngram occurrences="7" value="pt" /> + <ngram occurrences="7" value="or_" /> + <ngram occurrences="7" value="oqu" /> + <ngram occurrences="7" value="oq" /> + <ngram occurrences="7" value="on_" /> + <ngram occurrences="7" value="omn" /> + <ngram occurrences="7" value="oe" /> + <ngram occurrences="7" value="ntem_" /> + <ngram occurrences="7" value="non_" /> + <ngram occurrences="7" value="mn" /> + <ngram occurrences="7" value="mit" /> + <ngram occurrences="7" value="m_n" /> + <ngram occurrences="7" value="m_h" /> + <ngram occurrences="7" value="m_d" /> + <ngram occurrences="7" value="m_a" /> + <ngram occurrences="7" value="lt" /> + <ngram occurrences="7" value="lle" /> + <ngram occurrences="7" value="is_i" /> + <ngram occurrences="7" value="ine" /> + <ngram occurrences="7" value="ina_" /> + <ngram occurrences="7" value="ina" /> + <ngram occurrences="7" value="in_" /> + <ngram occurrences="7" value="imu" /> + <ngram occurrences="7" value="i_s" /> + <ngram occurrences="7" value="ho" /> +</ngrams> diff --git a/src/plugins/language/latvian.klp b/src/plugins/language/latvian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="618" value="_" /> + <ngram occurrences="463" value="a" /> + <ngram occurrences="354" value="i" /> + <ngram occurrences="328" value="s" /> + <ngram occurrences="260" value="t" /> + <ngram occurrences="230" value="e" /> + <ngram occurrences="223" value="u" /> + <ngram occurrences="211" value="n" /> + <ngram occurrences="201" value="r" /> + <ngram occurrences="179" value="m" /> + <ngram occurrences="176" value="s_" /> + <ngram occurrences="144" value="o" /> + <ngram occurrences="143" value="k" /> + <ngram occurrences="142" value="â" /> + <ngram occurrences="136" value="p" /> + <ngram occurrences="118" value="l" /> + <ngram occurrences="100" value="î" /> + <ngram occurrences="96" value="ie" /> + <ngram occurrences="94" value="v" /> + <ngram occurrences="93" value="j" /> + <ngram occurrences="92" value="d" /> + <ngram occurrences="86" value="a_" /> + <ngram occurrences="75" value="u_" /> + <ngram occurrences="75" value="as" /> + <ngram occurrences="73" value="_p" /> + <ngram occurrences="69" value="ç" /> + <ngram occurrences="69" value="z" /> + <ngram occurrences="66" value="as_" /> + <ngram occurrences="60" value="_n" /> + <ngram occurrences="59" value="b" /> + <ngram occurrences="58" value="ð" /> + <ngram occurrences="57" value="_a" /> + <ngram occurrences="55" value="um" /> + <ngram occurrences="54" value="g" /> + <ngram occurrences="53" value="ar" /> + <ngram occurrences="51" value="_v" /> + <ngram occurrences="46" value="_k" /> + <ngram occurrences="45" value="ti" /> + <ngram occurrences="45" value="pa" /> + <ngram occurrences="44" value="i_" /> + <ngram occurrences="43" value="c" /> + <ngram occurrences="41" value="es" /> + <ngram occurrences="41" value="_t" /> + <ngram occurrences="40" value="no" /> + <ngram occurrences="40" value="ma" /> + <ngram occurrences="39" value="at" /> + <ngram occurrences="38" value="ta" /> + <ngram occurrences="38" value="en" /> + <ngram occurrences="37" value="st" /> + <ngram occurrences="36" value="_i" /> + <ngram occurrences="35" value="va" /> + <ngram occurrences="35" value="ja" /> + <ngram occurrences="34" value="r_" /> + <ngram occurrences="34" value="_s" /> + <ngram occurrences="33" value="is" /> + <ngram occurrences="33" value="in" /> + <ngram occurrences="33" value="_u" /> + <ngram occurrences="33" value="_no" /> + <ngram occurrences="32" value="ai" /> + <ngram occurrences="31" value="_pa" /> + <ngram occurrences="30" value="â_" /> + <ngram occurrences="30" value="ra" /> + <ngram occurrences="30" value="ju" /> + <ngram occurrences="30" value="em" /> + <ngram occurrences="30" value="an" /> + <ngram occurrences="29" value="n_" /> + <ngram occurrences="29" value="m_" /> + <ngram occurrences="28" value="sa" /> + <ngram occurrences="28" value="pr" /> + <ngram occurrences="28" value="o_" /> + <ngram occurrences="28" value="ij" /> + <ngram occurrences="28" value="_l" /> + <ngram occurrences="27" value="un" /> + <ngram occurrences="27" value="tie" /> + <ngram occurrences="27" value="te" /> + <ngram occurrences="27" value="ri" /> + <ngram occurrences="27" value="iz" /> + <ngram occurrences="26" value="na" /> + <ngram occurrences="26" value="mi" /> + <ngram occurrences="25" value="ik" /> + <ngram occurrences="25" value="_va" /> + <ngram occurrences="25" value="_d" /> + <ngram occurrences="24" value="vi" /> + <ngram occurrences="24" value="ar_" /> + <ngram occurrences="23" value="un_" /> + <ngram occurrences="23" value="s_p" /> + <ngram occurrences="23" value="ot" /> + <ngram occurrences="23" value="nâ" /> + <ngram occurrences="23" value="ku" /> + <ngram occurrences="23" value="_un_" /> + <ngram occurrences="23" value="_un" /> + <ngram occurrences="22" value="îb" /> + <ngram occurrences="22" value="ts" /> + <ngram occurrences="22" value="ne" /> + <ngram occurrences="22" value="la" /> + <ngram occurrences="22" value="ka" /> + <ngram occurrences="22" value="iem" /> + <ngram occurrences="22" value="au" /> + <ngram occurrences="22" value="ap" /> + <ngram occurrences="21" value="t_" /> + <ngram occurrences="21" value="ro" /> + <ngram occurrences="21" value="ko" /> + <ngram occurrences="21" value="al" /> + <ngram occurrences="20" value="îg" /> + <ngram occurrences="20" value="tâ" /> + <ngram occurrences="20" value="ei" /> + <ngram occurrences="20" value="ba" /> + <ngram occurrences="20" value="_m" /> + <ngram occurrences="20" value="_iz" /> + <ngram occurrences="20" value="_ar" /> + <ngram occurrences="19" value="ða" /> + <ngram occurrences="19" value="tu" /> + <ngram occurrences="19" value="s_a" /> + <ngram occurrences="19" value="ms_" /> + <ngram occurrences="19" value="ms" /> + <ngram occurrences="19" value="ija" /> + <ngram occurrences="19" value="am" /> + <ngram occurrences="18" value="âs_" /> + <ngram occurrences="18" value="âs" /> + <ngram occurrences="18" value="tr" /> + <ngram occurrences="18" value="pi" /> + <ngram occurrences="18" value="nt" /> + <ngram occurrences="18" value="ma_" /> + <ngram occurrences="18" value="lî" /> + <ngram occurrences="18" value="jum" /> + <ngram occurrences="18" value="iem_" /> + <ngram occurrences="18" value="es_" /> + <ngram occurrences="18" value="em_" /> + <ngram occurrences="18" value="ek" /> + <ngram occurrences="18" value="dz" /> + <ngram occurrences="18" value="ci" /> + <ngram occurrences="18" value="_ko" /> + <ngram occurrences="17" value="s_v" /> + <ngram occurrences="17" value="mu" /> + <ngram occurrences="17" value="kâ" /> + <ngram occurrences="17" value="ir" /> + <ngram occurrences="17" value="ies" /> + <ngram occurrences="17" value="ien" /> + <ngram occurrences="17" value="gu" /> + <ngram occurrences="17" value="ga" /> + <ngram occurrences="17" value="_ti" /> + <ngram occurrences="17" value="_pr" /> + <ngram occurrences="17" value="_ne" /> + <ngram occurrences="16" value="uma_" /> + <ngram occurrences="16" value="uma" /> + <ngram occurrences="16" value="ts_" /> + <ngram occurrences="16" value="si" /> + <ngram occurrences="16" value="s_n" /> + <ngram occurrences="16" value="rî" /> + <ngram occurrences="16" value="inâ" /> + <ngram occurrences="16" value="_at" /> + <ngram occurrences="15" value="îba" /> + <ngram occurrences="15" value="zî" /> + <ngram occurrences="15" value="us" /> + <ngram occurrences="15" value="om" /> + <ngram occurrences="15" value="li" /> + <ngram occurrences="15" value="kum" /> + <ngram occurrences="15" value="ja_" /> + <ngram occurrences="15" value="et" /> + <ngram occurrences="15" value="da" /> + <ngram occurrences="15" value="_sa" /> + <ngram occurrences="14" value="ðan" /> + <ngram occurrences="14" value="ums_" /> + <ngram occurrences="14" value="ums" /> + <ngram occurrences="14" value="ties" /> + <ngram occurrences="14" value="s_k" /> + <ngram occurrences="14" value="pie" /> + <ngram occurrences="14" value="par" /> + <ngram occurrences="14" value="mâ" /> + <ngram occurrences="14" value="jâ" /> + <ngram occurrences="14" value="_tie" /> + <ngram occurrences="14" value="_r" /> + <ngram occurrences="14" value="_pi" /> + <ngram occurrences="14" value="_par" /> + <ngram occurrences="13" value="û" /> + <ngram occurrences="13" value="ò" /> + <ngram occurrences="13" value="ði" /> + <ngram occurrences="13" value="ï" /> + <ngram occurrences="13" value="çr" /> + <ngram occurrences="13" value="çj" /> + <ngram occurrences="13" value="âj" /> + <ngram occurrences="13" value="âd" /> + <ngram occurrences="13" value="ta_" /> + <ngram occurrences="13" value="ni" /> + <ngram occurrences="13" value="_pie" /> + <ngram occurrences="13" value="_g" /> + <ngram occurrences="13" value="_c" /> + <ngram occurrences="13" value="_b" /> + <ngram occurrences="12" value="âl" /> + <ngram occurrences="12" value="âk" /> + <ngram occurrences="12" value="vç" /> + <ngram occurrences="12" value="tu_" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="sk" /> + <ngram occurrences="12" value="s_s" /> + <ngram occurrences="12" value="rt" /> + <ngram occurrences="12" value="lç" /> + <ngram occurrences="12" value="kt" /> + <ngram occurrences="12" value="gum" /> + <ngram occurrences="12" value="ent" /> + <ngram occurrences="12" value="di" /> + <ngram occurrences="12" value="bi" /> + <ngram occurrences="12" value="ai_" /> + <ngram occurrences="12" value="_vi" /> + <ngram occurrences="11" value="îgu" /> + <ngram occurrences="11" value="îbas_" /> + <ngram occurrences="11" value="îbas" /> + <ngram occurrences="11" value="î_" /> + <ngram occurrences="11" value="val" /> + <ngram occurrences="11" value="umu" /> + <ngram occurrences="11" value="sp" /> + <ngram occurrences="11" value="s_i" /> + <ngram occurrences="11" value="râ" /> + <ngram occurrences="11" value="ru" /> + <ngram occurrences="11" value="os" /> + <ngram occurrences="11" value="on" /> + <ngram occurrences="11" value="mu_" /> + <ngram occurrences="11" value="ks" /> + <ngram occurrences="11" value="jas_" /> + <ngram occurrences="11" value="jas" /> + <ngram occurrences="11" value="eik" /> + <ngram occurrences="11" value="dî" /> + <ngram occurrences="11" value="bas_" /> + <ngram occurrences="11" value="bas" /> + <ngram occurrences="11" value="ak" /> + <ngram occurrences="11" value="ad" /> + <ngram occurrences="11" value="_ar_" /> + <ngram occurrences="11" value="__" /> + <ngram occurrences="10" value="îgum" /> + <ngram occurrences="10" value="âm" /> + <ngram occurrences="10" value="vie" /> + <ngram occurrences="10" value="ut" /> + <ngram occurrences="10" value="umu_" /> + <ngram occurrences="10" value="u_p" /> + <ngram occurrences="10" value="teik" /> + <ngram occurrences="10" value="tei" /> + <ngram occurrences="10" value="se" /> + <ngram occurrences="10" value="s_u" /> + <ngram occurrences="10" value="s_pa" /> + <ngram occurrences="10" value="re" /> + <ngram occurrences="10" value="pro" /> + <ngram occurrences="10" value="nî" /> + <ngram occurrences="10" value="no_" /> + <ngram occurrences="10" value="me" /> + <ngram occurrences="10" value="lîg" /> + <ngram occurrences="10" value="ls" /> + <ngram occurrences="10" value="ld" /> + <ngram occurrences="10" value="ju_" /> + <ngram occurrences="10" value="is_" /> + <ngram occurrences="10" value="ikum" /> + <ngram occurrences="10" value="iku" /> + <ngram occurrences="10" value="ijas_" /> + <ngram occurrences="10" value="ijas" /> + <ngram occurrences="10" value="f" /> + <ngram occurrences="10" value="eð" /> + <ngram occurrences="10" value="de" /> + <ngram occurrences="10" value="a_k" /> + <ngram occurrences="10" value="_ð" /> + <ngram occurrences="10" value="_vç" /> + <ngram occurrences="10" value="_ties" /> + <ngram occurrences="10" value="_no_" /> + <ngram occurrences="10" value="_la" /> + <ngram occurrences="10" value="_ka" /> + <ngram occurrences="10" value="___" /> + <ngram occurrences="9" value="çl" /> + <ngram occurrences="9" value="ât" /> + <ngram occurrences="9" value="âju" /> + <ngram occurrences="9" value="vien" /> + <ngram occurrences="9" value="vai" /> + <ngram occurrences="9" value="u_n" /> + <ngram occurrences="9" value="sî" /> + <ngram occurrences="9" value="s_va" /> + <ngram occurrences="9" value="s_t" /> + <ngram occurrences="9" value="s_no" /> + <ngram occurrences="9" value="rî_" /> + <ngram occurrences="9" value="pri" /> + <ngram occurrences="9" value="oð" /> + <ngram occurrences="9" value="oj" /> + <ngram occurrences="9" value="nu" /> + <ngram occurrences="9" value="ns" /> + <ngram occurrences="9" value="na_" /> + <ngram occurrences="9" value="mç" /> + <ngram occurrences="9" value="lîgum" /> + <ngram occurrences="9" value="lîgu" /> + <ngram occurrences="9" value="lst" /> + <ngram occurrences="9" value="kom" /> + <ngram occurrences="9" value="jâ_" /> + <ngram occurrences="9" value="il" /> + <ngram occurrences="9" value="ija_" /> + <ngram occurrences="9" value="iek" /> + <ngram occurrences="9" value="dzî" /> + <ngram occurrences="9" value="ce" /> + <ngram occurrences="9" value="að" /> + <ngram occurrences="9" value="av" /> + <ngram occurrences="9" value="as_p" /> + <ngram occurrences="9" value="arî" /> + <ngram occurrences="9" value="ais" /> + <ngram occurrences="9" value="_vai" /> + <ngram occurrences="9" value="_lî" /> + <ngram occurrences="9" value="_kom" /> + <ngram occurrences="9" value="_ga" /> + <ngram occurrences="9" value="_e" /> + <ngram occurrences="9" value="_ap" /> + <ngram occurrences="9" value="____" /> + <ngram occurrences="8" value="ût" /> + <ngram occurrences="8" value="îr" /> + <ngram occurrences="8" value="ç_" /> + <ngram occurrences="8" value="âr" /> + <ngram occurrences="8" value="âjum" /> + <ngram occurrences="8" value="vo" /> + <ngram occurrences="8" value="uz" /> + <ngram occurrences="8" value="s_ko" /> + <ngram occurrences="8" value="s_g" /> + <ngram occurrences="8" value="s_d" /> + <ngram occurrences="8" value="rie" /> + <ngram occurrences="8" value="pap" /> + <ngram occurrences="8" value="or" /> + <ngram occurrences="8" value="nu_" /> + <ngram occurrences="8" value="nos" /> + <ngram occurrences="8" value="men" /> + <ngram occurrences="8" value="it" /> + <ngram occurrences="8" value="ir_" /> + <ngram occurrences="8" value="ikt" /> + <ngram occurrences="8" value="esa" /> + <ngram occurrences="8" value="aut" /> + <ngram occurrences="8" value="as_k" /> + <ngram occurrences="8" value="arî_" /> + <ngram occurrences="8" value="ana" /> + <ngram occurrences="8" value="a_v" /> + <ngram occurrences="8" value="a_u" /> + <ngram occurrences="8" value="a_s" /> + <ngram occurrences="8" value="a_p" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_val" /> + <ngram occurrences="8" value="_uz" /> + <ngram occurrences="8" value="_ta" /> + <ngram occurrences="8" value="_ra" /> + <ngram occurrences="8" value="_li" /> + <ngram occurrences="8" value="_j" /> + <ngram occurrences="8" value="_ir_" /> + <ngram occurrences="8" value="_ir" /> + <ngram occurrences="8" value="_arî_" /> + <ngram occurrences="8" value="_arî" /> + <ngram occurrences="8" value="_____" /> + <ngram occurrences="7" value="ðana" /> + <ngram occurrences="7" value="îv" /> + <ngram occurrences="7" value="îj" /> + <ngram occurrences="7" value="îd" /> + <ngram occurrences="7" value="îbu_" /> + <ngram occurrences="7" value="îbu" /> + <ngram occurrences="7" value="zâ" /> + <ngram occurrences="7" value="zs" /> + <ngram occurrences="7" value="vçr" /> + <ngram occurrences="7" value="var" /> + <ngram occurrences="7" value="vai_" /> + <ngram occurrences="7" value="us_" /> + <ngram occurrences="7" value="ur" /> + <ngram occurrences="7" value="u_v" /> + <ngram occurrences="7" value="tç" /> + <ngram occurrences="7" value="tas_" /> + <ngram occurrences="7" value="tas" /> + <ngram occurrences="7" value="sts_" /> + <ngram occurrences="7" value="sts" /> + <ngram occurrences="7" value="sta" /> + <ngram occurrences="7" value="s_ar" /> + <ngram occurrences="7" value="ras" /> + <ngram occurrences="7" value="pu" /> + <ngram occurrences="7" value="par_" /> + <ngram occurrences="7" value="nta" /> + <ngram occurrences="7" value="not" /> + <ngram occurrences="7" value="nis" /> + <ngram occurrences="7" value="nes" /> + <ngram occurrences="7" value="mie" /> + <ngram occurrences="7" value="ment" /> + <ngram occurrences="7" value="likum" /> + <ngram occurrences="7" value="liku" /> + <ngram occurrences="7" value="lik" /> + <ngram occurrences="7" value="ldî" /> + <ngram occurrences="7" value="lai" /> + <ngram occurrences="7" value="kas_" /> + <ngram occurrences="7" value="kas" /> + <ngram occurrences="7" value="k_" /> + <ngram occurrences="7" value="isk" /> + <ngram occurrences="7" value="isi" /> + <ngram occurrences="7" value="im" /> + <ngram occurrences="7" value="ieð" /> + <ngram occurrences="7" value="iet" /> + <ngram occurrences="7" value="er" /> + <ngram occurrences="7" value="ec" /> + <ngram occurrences="7" value="du" /> + <ngram occurrences="7" value="cij" /> + <ngram occurrences="7" value="bu_" /> + <ngram occurrences="7" value="bu" /> + <ngram occurrences="7" value="as_v" /> + <ngram occurrences="7" value="as_n" /> + <ngram occurrences="7" value="alst" /> + <ngram occurrences="7" value="als" /> + <ngram occurrences="7" value="aks" /> + <ngram occurrences="7" value="a_un_" /> + <ngram occurrences="7" value="a_un" /> +</ngrams> diff --git a/src/plugins/language/lithuanian.klp b/src/plugins/language/lithuanian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="766" value="_" /> + <ngram occurrences="549" value="i" /> + <ngram occurrences="494" value="a" /> + <ngram occurrences="341" value="s" /> + <ngram occurrences="216" value="t" /> + <ngram occurrences="216" value="o" /> + <ngram occurrences="213" value="r" /> + <ngram occurrences="211" value="u" /> + <ngram occurrences="208" value="e" /> + <ngram occurrences="197" value="n" /> + <ngram occurrences="192" value="k" /> + <ngram occurrences="148" value="l" /> + <ngram occurrences="146" value="s_" /> + <ngram occurrences="134" value="p" /> + <ngram occurrences="128" value="i_" /> + <ngram occurrences="115" value="d" /> + <ngram occurrences="110" value="m" /> + <ngram occurrences="106" value="v" /> + <ngram occurrences="103" value="ó" /> + <ngram occurrences="95" value="o_" /> + <ngram occurrences="80" value="g" /> + <ngram occurrences="80" value="ai" /> + <ngram occurrences="78" value="_p" /> + <ngram occurrences="74" value="_k" /> + <ngram occurrences="73" value="_i" /> + <ngram occurrences="71" value="ý" /> + <ngram occurrences="71" value="j" /> + <ngram occurrences="67" value="_s" /> + <ngram occurrences="66" value="_n" /> + <ngram occurrences="65" value="as" /> + <ngram occurrences="64" value="a_" /> + <ngram occurrences="61" value="is" /> + <ngram occurrences="60" value="ta" /> + <ngram occurrences="60" value="b" /> + <ngram occurrences="60" value="_v" /> + <ngram occurrences="59" value="_t" /> + <ngram occurrences="58" value="si" /> + <ngram occurrences="55" value="y" /> + <ngram occurrences="55" value="au" /> + <ngram occurrences="53" value="ia" /> + <ngram occurrences="52" value="ir" /> + <ngram occurrences="51" value="pa" /> + <ngram occurrences="49" value="ne" /> + <ngram occurrences="47" value="r_" /> + <ngram occurrences="45" value="u_" /> + <ngram occurrences="45" value="ka" /> + <ngram occurrences="43" value="_ne" /> + <ngram occurrences="42" value="ti" /> + <ngram occurrences="42" value="ie" /> + <ngram occurrences="42" value="ai_" /> + <ngram occurrences="42" value="_pa" /> + <ngram occurrences="41" value="li" /> + <ngram occurrences="40" value="is_" /> + <ngram occurrences="40" value="e_" /> + <ngram occurrences="40" value="as_" /> + <ngram occurrences="40" value="_a" /> + <ngram occurrences="38" value="in" /> + <ngram occurrences="38" value="ar" /> + <ngram occurrences="37" value="vi" /> + <ngram occurrences="36" value="ra" /> + <ngram occurrences="36" value="da" /> + <ngram occurrences="36" value="_ir" /> + <ngram occurrences="36" value="_d" /> + <ngram occurrences="34" value="st" /> + <ngram occurrences="34" value="ri" /> + <ngram occurrences="33" value="ý_" /> + <ngram occurrences="33" value="us" /> + <ngram occurrences="33" value="am" /> + <ngram occurrences="32" value="ir_" /> + <ngram occurrences="32" value="_vi" /> + <ngram occurrences="32" value="_ir_" /> + <ngram occurrences="31" value="ó_" /> + <ngram occurrences="31" value="ik" /> + <ngram occurrences="31" value="_j" /> + <ngram occurrences="29" value="an" /> + <ngram occurrences="29" value="al" /> + <ngram occurrences="28" value="ma" /> + <ngram occurrences="28" value="ko" /> + <ngram occurrences="28" value="_ta" /> + <ngram occurrences="27" value="ù" /> + <ngram occurrences="26" value="ù_" /> + <ngram occurrences="26" value="su" /> + <ngram occurrences="25" value="õ" /> + <ngram occurrences="25" value="en" /> + <ngram occurrences="24" value="ßi" /> + <ngram occurrences="24" value="ß" /> + <ngram occurrences="24" value="uo" /> + <ngram occurrences="24" value="ki" /> + <ngram occurrences="24" value="_b" /> + <ngram occurrences="23" value="sa" /> + <ngram occurrences="23" value="_ka" /> + <ngram occurrences="23" value="_i_" /> + <ngram occurrences="22" value="pr" /> + <ngram occurrences="22" value="os" /> + <ngram occurrences="22" value="na" /> + <ngram occurrences="22" value="la" /> + <ngram occurrences="22" value="_m" /> + <ngram occurrences="22" value="_l" /> + <ngram occurrences="21" value="to" /> + <ngram occurrences="21" value="mi" /> + <ngram occurrences="21" value="ga" /> + <ngram occurrences="21" value="es" /> + <ngram occurrences="21" value="_g" /> + <ngram occurrences="20" value="nu" /> + <ngram occurrences="20" value="ni" /> + <ngram occurrences="20" value="at" /> + <ngram occurrences="19" value="õ_" /> + <ngram occurrences="19" value="ti_" /> + <ngram occurrences="19" value="mo" /> + <ngram occurrences="19" value="jo" /> + <ngram occurrences="19" value="iu" /> + <ngram occurrences="19" value="il" /> + <ngram occurrences="19" value="er" /> + <ngram occurrences="19" value="el" /> + <ngram occurrences="19" value="au_" /> + <ngram occurrences="19" value="_su" /> + <ngram occurrences="18" value="ñ" /> + <ngram occurrences="18" value="va" /> + <ngram occurrences="18" value="ur" /> + <ngram occurrences="18" value="ei" /> + <ngram occurrences="18" value="ama" /> + <ngram occurrences="17" value="ve" /> + <ngram occurrences="17" value="us_" /> + <ngram occurrences="17" value="tai" /> + <ngram occurrences="17" value="s_i" /> + <ngram occurrences="17" value="ja" /> + <ngram occurrences="17" value="i_k" /> + <ngram occurrences="17" value="_pr" /> + <ngram occurrences="16" value="ól" /> + <ngram occurrences="16" value="ój" /> + <ngram occurrences="16" value="ßia" /> + <ngram occurrences="16" value="sta" /> + <ngram occurrences="16" value="s_p" /> + <ngram occurrences="16" value="od" /> + <ngram occurrences="16" value="jo_" /> + <ngram occurrences="16" value="ip" /> + <ngram occurrences="16" value="im" /> + <ngram occurrences="16" value="iau" /> + <ngram occurrences="16" value="dó" /> + <ngram occurrences="16" value="di" /> + <ngram occurrences="15" value="vis" /> + <ngram occurrences="15" value="s_n" /> + <ngram occurrences="15" value="pri" /> + <ngram occurrences="15" value="nt" /> + <ngram occurrences="15" value="mas" /> + <ngram occurrences="15" value="ló" /> + <ngram occurrences="15" value="ku" /> + <ngram occurrences="15" value="iai" /> + <ngram occurrences="15" value="i_p" /> + <ngram occurrences="15" value="be" /> + <ngram occurrences="15" value="_vis" /> + <ngram occurrences="15" value="_r" /> + <ngram occurrences="15" value="_ko" /> + <ngram occurrences="14" value="ós" /> + <ngram occurrences="14" value="ñ_" /> + <ngram occurrences="14" value="ul" /> + <ngram occurrences="14" value="uk" /> + <ngram occurrences="14" value="t_" /> + <ngram occurrences="14" value="s_s" /> + <ngram occurrences="14" value="oj" /> + <ngram occurrences="14" value="io" /> + <ngram occurrences="14" value="et" /> + <ngram occurrences="14" value="asi" /> + <ngram occurrences="14" value="ad" /> + <ngram occurrences="14" value="_o" /> + <ngram occurrences="14" value="_da" /> + <ngram occurrences="13" value="û" /> + <ngram occurrences="13" value="si_" /> + <ngram occurrences="13" value="s_t" /> + <ngram occurrences="13" value="ro" /> + <ngram occurrences="13" value="pas" /> + <ngram occurrences="13" value="os_" /> + <ngram occurrences="13" value="it" /> + <ngram occurrences="13" value="i_v" /> + <ngram occurrences="13" value="i_t" /> + <ngram occurrences="13" value="gi" /> + <ngram occurrences="13" value="ba" /> + <ngram occurrences="13" value="ak" /> + <ngram occurrences="12" value="ýi" /> + <ngram occurrences="12" value="vo" /> + <ngram occurrences="12" value="vie" /> + <ngram occurrences="12" value="tu" /> + <ngram occurrences="12" value="sk" /> + <ngram occurrences="12" value="p_" /> + <ngram occurrences="12" value="om" /> + <ngram occurrences="12" value="no" /> + <ngram occurrences="12" value="ke" /> + <ngram occurrences="12" value="ji" /> + <ngram occurrences="12" value="iai_" /> + <ngram occurrences="12" value="du" /> + <ngram occurrences="12" value="amas" /> + <ngram occurrences="12" value="_pri" /> + <ngram occurrences="12" value="_nu" /> + <ngram occurrences="11" value="ós_" /> + <ngram occurrences="11" value="s_v" /> + <ngram occurrences="11" value="rt" /> + <ngram occurrences="11" value="on" /> + <ngram occurrences="11" value="ne_" /> + <ngram occurrences="11" value="na_" /> + <ngram occurrences="11" value="mas_" /> + <ngram occurrences="11" value="lo" /> + <ngram occurrences="11" value="kó" /> + <ngram occurrences="11" value="ko_" /> + <ngram occurrences="11" value="k_" /> + <ngram occurrences="11" value="ien" /> + <ngram occurrences="11" value="ie_" /> + <ngram occurrences="11" value="iau_" /> + <ngram occurrences="11" value="i_n" /> + <ngram occurrences="11" value="ek" /> + <ngram occurrences="11" value="dam" /> + <ngram occurrences="11" value="_vie" /> + <ngram occurrences="11" value="_pas" /> + <ngram occurrences="11" value="_o_" /> + <ngram occurrences="11" value="_la" /> + <ngram occurrences="10" value="z" /> + <ngram occurrences="10" value="yt" /> + <ngram occurrences="10" value="usi" /> + <ngram occurrences="10" value="ug" /> + <ngram occurrences="10" value="só" /> + <ngram occurrences="10" value="s_ne" /> + <ngram occurrences="10" value="rd" /> + <ngram occurrences="10" value="ol" /> + <ngram occurrences="10" value="ok" /> + <ngram occurrences="10" value="o_v" /> + <ngram occurrences="10" value="o_k" /> + <ngram occurrences="10" value="ng" /> + <ngram occurrences="10" value="ly" /> + <ngram occurrences="10" value="iù_" /> + <ngram occurrences="10" value="iù" /> + <ngram occurrences="10" value="iu_" /> + <ngram occurrences="10" value="ies" /> + <ngram occurrences="10" value="ia_" /> + <ngram occurrences="10" value="i_s" /> + <ngram occurrences="10" value="go" /> + <ngram occurrences="10" value="ep" /> + <ngram occurrences="10" value="ap" /> + <ngram occurrences="10" value="ant" /> + <ngram occurrences="10" value="aip" /> + <ngram occurrences="10" value="aik" /> + <ngram occurrences="10" value="_ý" /> + <ngram occurrences="10" value="_õ" /> + <ngram occurrences="10" value="_va" /> + <ngram occurrences="10" value="_ti" /> + <ngram occurrences="10" value="_sa" /> + <ngram occurrences="10" value="_ku" /> + <ngram occurrences="10" value="_ji" /> + <ngram occurrences="9" value="ód" /> + <ngram occurrences="9" value="yr" /> + <ngram occurrences="9" value="vy" /> + <ngram occurrences="9" value="um" /> + <ngram occurrences="9" value="tý" /> + <ngram occurrences="9" value="tó" /> + <ngram occurrences="9" value="ty" /> + <ngram occurrences="9" value="tik" /> + <ngram occurrences="9" value="tai_" /> + <ngram occurrences="9" value="sau" /> + <ngram occurrences="9" value="s_ta" /> + <ngram occurrences="9" value="s_pa" /> + <ngram occurrences="9" value="s_k" /> + <ngram occurrences="9" value="s_ir" /> + <ngram occurrences="9" value="rie" /> + <ngram occurrences="9" value="re" /> + <ngram occurrences="9" value="r_p" /> + <ngram occurrences="9" value="pi" /> + <ngram occurrences="9" value="o_s" /> + <ngram occurrences="9" value="o_p" /> + <ngram occurrences="9" value="nó" /> + <ngram occurrences="9" value="nk" /> + <ngram occurrences="9" value="n_" /> + <ngram occurrences="9" value="me" /> + <ngram occurrences="9" value="kel" /> + <ngram occurrences="9" value="id" /> + <ngram occurrences="9" value="i_i" /> + <ngram occurrences="9" value="eli" /> + <ngram occurrences="9" value="dama" /> + <ngram occurrences="9" value="bu" /> + <ngram occurrences="9" value="aßi" /> + <ngram occurrences="9" value="aß" /> + <ngram occurrences="9" value="av" /> + <ngram occurrences="9" value="aul" /> + <ngram occurrences="9" value="ais" /> + <ngram occurrences="9" value="ag" /> + <ngram occurrences="9" value="ab" /> + <ngram occurrences="9" value="_st" /> + <ngram occurrences="9" value="_sk" /> + <ngram occurrences="9" value="_be" /> + <ngram occurrences="9" value="_ar" /> + <ngram occurrences="8" value="ßiau" /> + <ngram occurrences="8" value="vó" /> + <ngram occurrences="8" value="vien" /> + <ngram occurrences="8" value="un" /> + <ngram occurrences="8" value="u_p" /> + <ngram occurrences="8" value="tý_" /> + <ngram occurrences="8" value="ts" /> + <ngram occurrences="8" value="tr" /> + <ngram occurrences="8" value="tas" /> + <ngram occurrences="8" value="se" /> + <ngram occurrences="8" value="saul" /> + <ngram occurrences="8" value="s_j" /> + <ngram occurrences="8" value="s_ir_" /> + <ngram occurrences="8" value="s_g" /> + <ngram occurrences="8" value="rie_" /> + <ngram occurrences="8" value="ra_" /> + <ngram occurrences="8" value="pu" /> + <ngram occurrences="8" value="prie" /> + <ngram occurrences="8" value="nuo" /> + <ngram occurrences="8" value="m_" /> + <ngram occurrences="8" value="ks" /> + <ngram occurrences="8" value="kr" /> + <ngram occurrences="8" value="kai" /> + <ngram occurrences="8" value="ju" /> + <ngram occurrences="8" value="je" /> + <ngram occurrences="8" value="iý" /> + <ngram occurrences="8" value="ip_" /> + <ngram occurrences="8" value="i_pa" /> + <ngram occurrences="8" value="gu" /> + <ngram occurrences="8" value="damas" /> + <ngram occurrences="8" value="d_" /> + <ngram occurrences="8" value="aus" /> + <ngram occurrences="8" value="ats" /> + <ngram occurrences="8" value="amas_" /> + <ngram occurrences="8" value="ali" /> + <ngram occurrences="8" value="aip_" /> + <ngram occurrences="8" value="ad_" /> + <ngram occurrences="8" value="_õ_" /> + <ngram occurrences="8" value="_vien" /> + <ngram occurrences="8" value="_tai" /> + <ngram occurrences="8" value="_sta" /> + <ngram occurrences="8" value="_prie" /> + <ngram occurrences="8" value="_ne_" /> + <ngram occurrences="8" value="_ju" /> + <ngram occurrences="8" value="_at" /> + <ngram occurrences="7" value="ö" /> + <ngram occurrences="7" value="ßiau_" /> + <ngram occurrences="7" value="yn" /> + <ngram occurrences="7" value="yd" /> + <ngram occurrences="7" value="vo_" /> + <ngram occurrences="7" value="uv" /> + <ngram occurrences="7" value="ut" /> + <ngram occurrences="7" value="u_n" /> + <ngram occurrences="7" value="to_" /> + <ngram occurrences="7" value="te" /> + <ngram occurrences="7" value="tas_" /> + <ngram occurrences="7" value="ta_" /> + <ngram occurrences="7" value="siu" /> + <ngram occurrences="7" value="sis" /> + <ngram occurrences="7" value="rp" /> + <ngram occurrences="7" value="r_n" /> + <ngram occurrences="7" value="prie_" /> + <ngram occurrences="7" value="pe" /> + <ngram occurrences="7" value="ojo" /> + <ngram occurrences="7" value="o_i" /> + <ngram occurrences="7" value="ný_" /> + <ngram occurrences="7" value="ný" /> + <ngram occurrences="7" value="nep" /> + <ngram occurrences="7" value="lik" /> + <ngram occurrences="7" value="lia" /> + <ngram occurrences="7" value="lai" /> + <ngram occurrences="7" value="l_" /> + <ngram occurrences="7" value="keli" /> + <ngram occurrences="7" value="kar" /> + <ngram occurrences="7" value="kad_" /> + <ngram occurrences="7" value="kad" /> + <ngram occurrences="7" value="jau" /> + <ngram occurrences="7" value="io_" /> + <ngram occurrences="7" value="gal" /> + <ngram occurrences="7" value="g_" /> + <ngram occurrences="7" value="dar" /> + <ngram occurrences="7" value="aßiau" /> + <ngram occurrences="7" value="aßia" /> + <ngram occurrences="7" value="aug" /> + <ngram occurrences="7" value="ar_" /> + <ngram occurrences="7" value="ais_" /> + <ngram occurrences="7" value="ai_k" /> + <ngram occurrences="7" value="_ö" /> + <ngram occurrences="7" value="_vy" /> + <ngram occurrences="7" value="_ra" /> + <ngram occurrences="7" value="_nuo" /> + <ngram occurrences="7" value="_nep" /> + <ngram occurrences="7" value="_kr" /> + <ngram occurrences="7" value="_kel" /> + <ngram occurrences="7" value="_ke" /> + <ngram occurrences="7" value="_ga" /> + <ngram occurrences="7" value="_bu" /> + <ngram occurrences="7" value="_ats" /> + <ngram occurrences="6" value="ýe" /> + <ngram occurrences="6" value="ý_s" /> + <ngram occurrences="6" value="ót" /> + <ngram occurrences="6" value="ól_" /> + <ngram occurrences="6" value="ójo_" /> + <ngram occurrences="6" value="ójo" /> + <ngram occurrences="6" value="ó_k" /> + <ngram occurrences="6" value="ó_i" /> + <ngram occurrences="6" value="ßia_" /> + <ngram occurrences="6" value="yra" /> + <ngram occurrences="6" value="uol" /> + <ngram occurrences="6" value="uli" /> + <ngram occurrences="6" value="u_i" /> + <ngram occurrences="6" value="tù" /> + <ngram occurrences="6" value="taßia" /> +</ngrams> diff --git a/src/plugins/language/malay.klp b/src/plugins/language/malay.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="842" value="a" /> + <ngram occurrences="735" value="_" /> + <ngram occurrences="408" value="n" /> + <ngram occurrences="321" value="e" /> + <ngram occurrences="297" value="i" /> + <ngram occurrences="242" value="an" /> + <ngram occurrences="223" value="k" /> + <ngram occurrences="194" value="d" /> + <ngram occurrences="177" value="t" /> + <ngram occurrences="177" value="r" /> + <ngram occurrences="176" value="u" /> + <ngram occurrences="176" value="m" /> + <ngram occurrences="163" value="g" /> + <ngram occurrences="151" value="s" /> + <ngram occurrences="151" value="n_" /> + <ngram occurrences="133" value="an_" /> + <ngram occurrences="128" value="p" /> + <ngram occurrences="127" value="l" /> + <ngram occurrences="122" value="a_" /> + <ngram occurrences="116" value="ng" /> + <ngram occurrences="116" value="b" /> + <ngram occurrences="110" value="da" /> + <ngram occurrences="109" value="_d" /> + <ngram occurrences="103" value="h" /> + <ngram occurrences="86" value="ka" /> + <ngram occurrences="82" value="_m" /> + <ngram occurrences="79" value="i_" /> + <ngram occurrences="74" value="y" /> + <ngram occurrences="74" value="ang" /> + <ngram occurrences="69" value="en" /> + <ngram occurrences="64" value="ya" /> + <ngram occurrences="62" value="la" /> + <ngram occurrences="62" value="ah" /> + <ngram occurrences="62" value="_s" /> + <ngram occurrences="61" value="er" /> + <ngram occurrences="61" value="_k" /> + <ngram occurrences="60" value="ng_" /> + <ngram occurrences="60" value="me" /> + <ngram occurrences="60" value="g_" /> + <ngram occurrences="59" value="o" /> + <ngram occurrences="59" value="__" /> + <ngram occurrences="58" value="___" /> + <ngram occurrences="57" value="_b" /> + <ngram occurrences="57" value="____" /> + <ngram occurrences="56" value="ar" /> + <ngram occurrences="56" value="_____" /> + <ngram occurrences="55" value="ra" /> + <ngram occurrences="55" value="ang_" /> + <ngram occurrences="55" value="_me" /> + <ngram occurrences="55" value="_da" /> + <ngram occurrences="54" value="di" /> + <ngram occurrences="53" value="at" /> + <ngram occurrences="51" value="ba" /> + <ngram occurrences="50" value="_p" /> + <ngram occurrences="49" value="h_" /> + <ngram occurrences="47" value="al" /> + <ngram occurrences="46" value="ak" /> + <ngram occurrences="45" value="ta" /> + <ngram occurrences="45" value="_a" /> + <ngram occurrences="44" value="se" /> + <ngram occurrences="44" value="ga" /> + <ngram occurrences="43" value="kan" /> + <ngram occurrences="42" value="ke" /> + <ngram occurrences="42" value="kan_" /> + <ngram occurrences="42" value="k_" /> + <ngram occurrences="40" value="sa" /> + <ngram occurrences="40" value="_di" /> + <ngram occurrences="39" value="pa" /> + <ngram occurrences="39" value="ah_" /> + <ngram occurrences="38" value="j" /> + <ngram occurrences="38" value="_t" /> + <ngram occurrences="37" value="pe" /> + <ngram occurrences="37" value="in" /> + <ngram occurrences="37" value="as" /> + <ngram occurrences="37" value="am" /> + <ngram occurrences="36" value="dan" /> + <ngram occurrences="34" value="c" /> + <ngram occurrences="34" value="_ke" /> + <ngram occurrences="33" value="yang_" /> + <ngram occurrences="33" value="yang" /> + <ngram occurrences="33" value="yan" /> + <ngram occurrences="33" value="ti" /> + <ngram occurrences="33" value="em" /> + <ngram occurrences="33" value="be" /> + <ngram occurrences="33" value="_se" /> + <ngram occurrences="32" value="u_" /> + <ngram occurrences="32" value="ma" /> + <ngram occurrences="32" value="_yang" /> + <ngram occurrences="32" value="_yan" /> + <ngram occurrences="32" value="_ya" /> + <ngram occurrences="32" value="_y" /> + <ngram occurrences="31" value="ha" /> + <ngram occurrences="30" value="it" /> + <ngram occurrences="30" value="_dan" /> + <ngram occurrences="29" value="tu" /> + <ngram occurrences="29" value="t_" /> + <ngram occurrences="29" value="r_" /> + <ngram occurrences="29" value="men" /> + <ngram occurrences="29" value="el" /> + <ngram occurrences="29" value="_pe" /> + <ngram occurrences="28" value="ala" /> + <ngram occurrences="27" value="te" /> + <ngram occurrences="27" value="ik" /> + <ngram occurrences="27" value="dan_" /> + <ngram occurrences="27" value="_men" /> + <ngram occurrences="27" value="_dan_" /> + <ngram occurrences="26" value="un" /> + <ngram occurrences="25" value="nd" /> + <ngram occurrences="25" value="na" /> + <ngram occurrences="25" value="ia" /> + <ngram occurrences="24" value="si" /> + <ngram occurrences="24" value="ri" /> + <ngram occurrences="24" value="ny" /> + <ngram occurrences="24" value="li" /> + <ngram occurrences="24" value="ad" /> + <ngram occurrences="24" value="_i" /> + <ngram occurrences="24" value="_ba" /> + <ngram occurrences="23" value="ja" /> + <ngram occurrences="22" value="w" /> + <ngram occurrences="22" value="nga" /> + <ngram occurrences="22" value="ap" /> + <ngram occurrences="22" value="_be" /> + <ngram occurrences="21" value="nya" /> + <ngram occurrences="21" value="n_d" /> + <ngram occurrences="21" value="m_" /> + <ngram occurrences="21" value="ep" /> + <ngram occurrences="21" value="eng" /> + <ngram occurrences="20" value="n_k" /> + <ngram occurrences="20" value="mb" /> + <ngram occurrences="20" value="ber" /> + <ngram occurrences="20" value="ada" /> + <ngram occurrences="19" value="wa" /> + <ngram occurrences="19" value="da_" /> + <ngram occurrences="19" value="at_" /> + <ngram occurrences="19" value="an_k" /> + <ngram occurrences="19" value="an_d" /> + <ngram occurrences="19" value="aka" /> + <ngram occurrences="19" value="ak_" /> + <ngram occurrences="18" value="ua" /> + <ngram occurrences="18" value="et" /> + <ngram occurrences="18" value="ara" /> + <ngram occurrences="17" value="ya_" /> + <ngram occurrences="17" value="uk" /> + <ngram occurrences="17" value="tu_" /> + <ngram occurrences="17" value="ran" /> + <ngram occurrences="17" value="pu" /> + <ngram occurrences="17" value="per" /> + <ngram occurrences="17" value="nda" /> + <ngram occurrences="17" value="mem" /> + <ngram occurrences="17" value="ek" /> + <ngram occurrences="17" value="ata" /> + <ngram occurrences="17" value="ai" /> + <ngram occurrences="17" value="ada_" /> + <ngram occurrences="17" value="a_d" /> + <ngram occurrences="17" value="_te" /> + <ngram occurrences="17" value="_mem" /> + <ngram occurrences="17" value="_c" /> + <ngram occurrences="16" value="nya_" /> + <ngram occurrences="16" value="ngk" /> + <ngram occurrences="16" value="lam" /> + <ngram occurrences="16" value="ir" /> + <ngram occurrences="16" value="gk" /> + <ngram occurrences="16" value="am_" /> + <ngram occurrences="16" value="aha" /> + <ngram occurrences="16" value="a_m" /> + <ngram occurrences="16" value="_ma" /> + <ngram occurrences="16" value="_ber" /> + <ngram occurrences="15" value="ur" /> + <ngram occurrences="15" value="s_" /> + <ngram occurrences="15" value="mu" /> + <ngram occurrences="15" value="lah" /> + <ngram occurrences="15" value="ki" /> + <ngram occurrences="15" value="end" /> + <ngram occurrences="15" value="eb" /> + <ngram occurrences="15" value="de" /> + <ngram occurrences="15" value="dal" /> + <ngram occurrences="15" value="a_p" /> + <ngram occurrences="14" value="tan" /> + <ngram occurrences="14" value="pada_" /> + <ngram occurrences="14" value="pada" /> + <ngram occurrences="14" value="pad" /> + <ngram occurrences="14" value="p_" /> + <ngram occurrences="14" value="ngan" /> + <ngram occurrences="14" value="n_s" /> + <ngram occurrences="14" value="n_p" /> + <ngram occurrences="14" value="le" /> + <ngram occurrences="14" value="lah_" /> + <ngram occurrences="14" value="ku" /> + <ngram occurrences="14" value="il" /> + <ngram occurrences="14" value="id" /> + <ngram occurrences="14" value="h_d" /> + <ngram occurrences="14" value="gi" /> + <ngram occurrences="14" value="gan" /> + <ngram occurrences="14" value="f" /> + <ngram occurrences="14" value="ban" /> + <ngram occurrences="14" value="asa" /> + <ngram occurrences="14" value="ar_" /> + <ngram occurrences="14" value="an_s" /> + <ngram occurrences="14" value="_sa" /> + <ngram occurrences="14" value="_n" /> + <ngram occurrences="13" value="ut" /> + <ngram occurrences="13" value="ni" /> + <ngram occurrences="13" value="ngka" /> + <ngram occurrences="13" value="ngan_" /> + <ngram occurrences="13" value="n_m" /> + <ngram occurrences="13" value="n_ke" /> + <ngram occurrences="13" value="mp" /> + <ngram occurrences="13" value="ing" /> + <ngram occurrences="13" value="gka" /> + <ngram occurrences="13" value="gan_" /> + <ngram occurrences="13" value="era" /> + <ngram occurrences="13" value="di_" /> + <ngram occurrences="13" value="dar" /> + <ngram occurrences="13" value="dala" /> + <ngram occurrences="13" value="ca" /> + <ngram occurrences="13" value="ay" /> + <ngram occurrences="13" value="ari" /> + <ngram occurrences="13" value="a_k" /> + <ngram occurrences="12" value="us" /> + <ngram occurrences="12" value="ter" /> + <ngram occurrences="12" value="pi" /> + <ngram occurrences="12" value="n_b" /> + <ngram occurrences="12" value="itu_" /> + <ngram occurrences="12" value="itu" /> + <ngram occurrences="12" value="es" /> + <ngram occurrences="12" value="enga" /> + <ngram occurrences="12" value="ela" /> + <ngram occurrences="12" value="an_p" /> + <ngram occurrences="12" value="an_ke" /> + <ngram occurrences="12" value="alam" /> + <ngram occurrences="12" value="ag" /> + <ngram occurrences="12" value="_j" /> + <ngram occurrences="11" value="ri_" /> + <ngram occurrences="11" value="pat" /> + <ngram occurrences="11" value="nt" /> + <ngram occurrences="11" value="n_a" /> + <ngram occurrences="11" value="lam_" /> + <ngram occurrences="11" value="ka_" /> + <ngram occurrences="11" value="ika" /> + <ngram occurrences="11" value="ih" /> + <ngram occurrences="11" value="i_d" /> + <ngram occurrences="11" value="emb" /> + <ngram occurrences="11" value="dalam" /> + <ngram occurrences="11" value="bu" /> + <ngram occurrences="11" value="bi" /> + <ngram occurrences="11" value="au" /> + <ngram occurrences="11" value="apa" /> + <ngram occurrences="11" value="alam_" /> + <ngram occurrences="11" value="a_t" /> + <ngram occurrences="11" value="_ti" /> + <ngram occurrences="11" value="_r" /> + <ngram occurrences="11" value="_l" /> + <ngram occurrences="11" value="_h" /> + <ngram occurrences="11" value="_de" /> + <ngram occurrences="11" value="_dala" /> + <ngram occurrences="11" value="_dal" /> + <ngram occurrences="11" value="_ban" /> + <ngram occurrences="10" value="ti_" /> + <ngram occurrences="10" value="seb" /> + <ngram occurrences="10" value="on" /> + <ngram occurrences="10" value="ng_m" /> + <ngram occurrences="10" value="ne" /> + <ngram occurrences="10" value="n_me" /> + <ngram occurrences="10" value="mba" /> + <ngram occurrences="10" value="lan" /> + <ngram occurrences="10" value="ko" /> + <ngram occurrences="10" value="g_m" /> + <ngram occurrences="10" value="epa" /> + <ngram occurrences="10" value="enda" /> + <ngram occurrences="10" value="ed" /> + <ngram occurrences="10" value="dak" /> + <ngram occurrences="10" value="atan" /> + <ngram occurrences="10" value="asi" /> + <ngram occurrences="10" value="angk" /> + <ngram occurrences="10" value="and" /> + <ngram occurrences="10" value="an_m" /> + <ngram occurrences="10" value="an_b" /> + <ngram occurrences="10" value="an_a" /> + <ngram occurrences="10" value="ali" /> + <ngram occurrences="10" value="akan_" /> + <ngram occurrences="10" value="akan" /> + <ngram occurrences="10" value="a_me" /> + <ngram occurrences="10" value="_per" /> + <ngram occurrences="10" value="_ka" /> + <ngram occurrences="10" value="_itu_" /> + <ngram occurrences="10" value="_itu" /> + <ngram occurrences="10" value="_it" /> + <ngram occurrences="9" value="ta_" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="si_" /> + <ngram occurrences="9" value="sep" /> + <ngram occurrences="9" value="san" /> + <ngram occurrences="9" value="ru" /> + <ngram occurrences="9" value="rk" /> + <ngram occurrences="9" value="re" /> + <ngram occurrences="9" value="rang" /> + <ngram occurrences="9" value="pen" /> + <ngram occurrences="9" value="nj" /> + <ngram occurrences="9" value="ng_d" /> + <ngram occurrences="9" value="n_t" /> + <ngram occurrences="9" value="n_se" /> + <ngram occurrences="9" value="n_di" /> + <ngram occurrences="9" value="mi" /> + <ngram occurrences="9" value="meng" /> + <ngram occurrences="9" value="memb" /> + <ngram occurrences="9" value="is" /> + <ngram occurrences="9" value="ib" /> + <ngram occurrences="9" value="i_m" /> + <ngram occurrences="9" value="i_da" /> + <ngram occurrences="9" value="hu" /> + <ngram occurrences="9" value="g_d" /> + <ngram occurrences="9" value="eg" /> + <ngram occurrences="9" value="du" /> + <ngram occurrences="9" value="aya" /> + <ngram occurrences="9" value="awa" /> + <ngram occurrences="9" value="aw" /> + <ngram occurrences="9" value="ap_" /> + <ngram occurrences="9" value="angka" /> + <ngram occurrences="9" value="ang_m" /> + <ngram occurrences="9" value="ang_d" /> + <ngram occurrences="9" value="an_se" /> + <ngram occurrences="9" value="aj" /> + <ngram occurrences="9" value="a_da" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="_pen" /> + <ngram occurrences="9" value="_pa" /> + <ngram occurrences="9" value="_meng" /> + <ngram occurrences="9" value="_memb" /> + <ngram occurrences="9" value="_di_" /> + <ngram occurrences="8" value="ura" /> + <ngram occurrences="8" value="un_" /> + <ngram occurrences="8" value="um" /> + <ngram occurrences="8" value="tan_" /> + <ngram occurrences="8" value="sa_" /> + <ngram occurrences="8" value="rt" /> + <ngram occurrences="8" value="ras" /> + <ngram occurrences="8" value="ran_" /> + <ngram occurrences="8" value="ra_" /> + <ngram occurrences="8" value="pun" /> + <ngram occurrences="8" value="or" /> + <ngram occurrences="8" value="ol" /> + <ngram occurrences="8" value="nja" /> + <ngram occurrences="8" value="ng_s" /> + <ngram occurrences="8" value="n_pe" /> + <ngram occurrences="8" value="n_be" /> + <ngram occurrences="8" value="lu" /> + <ngram occurrences="8" value="l_" /> + <ngram occurrences="8" value="kan_k" /> + <ngram occurrences="8" value="kan_d" /> + <ngram occurrences="8" value="k_s" /> + <ngram occurrences="8" value="ju" /> + <ngram occurrences="8" value="ita" /> + <ngram occurrences="8" value="iha" /> + <ngram occurrences="8" value="ida" /> + <ngram occurrences="8" value="ian" /> + <ngram occurrences="8" value="i_b" /> + <ngram occurrences="8" value="h_di" /> + <ngram occurrences="8" value="g_s" /> + <ngram occurrences="8" value="eta" /> + <ngram occurrences="8" value="ert" /> + <ngram occurrences="8" value="ena" /> + <ngram occurrences="8" value="emp" /> + <ngram occurrences="8" value="eli" /> + <ngram occurrences="8" value="eh" /> + <ngram occurrences="8" value="dik" /> + <ngram occurrences="8" value="den" /> + <ngram occurrences="8" value="dari" /> + <ngram occurrences="8" value="dak_" /> + <ngram occurrences="8" value="bah" /> + <ngram occurrences="8" value="bag" /> + <ngram occurrences="8" value="atan_" /> + <ngram occurrences="8" value="ana" /> + <ngram occurrences="8" value="an_di" /> + <ngram occurrences="8" value="ai_" /> + <ngram occurrences="8" value="ah_d" /> + <ngram occurrences="8" value="aa" /> + <ngram occurrences="8" value="a_s" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_w" /> + <ngram occurrences="8" value="_seb" /> + <ngram occurrences="8" value="_o" /> + <ngram occurrences="8" value="_mu" /> + <ngram occurrences="8" value="_in" /> + <ngram occurrences="7" value="ung" /> + <ngram occurrences="7" value="ul" /> + <ngram occurrences="7" value="tidak" /> + <ngram occurrences="7" value="tida" /> + <ngram occurrences="7" value="tid" /> + <ngram occurrences="7" value="t_d" /> + <ngram occurrences="7" value="pert" /> + <ngram occurrences="7" value="pat_" /> + <ngram occurrences="7" value="om" /> + <ngram occurrences="7" value="ng_me" /> + <ngram occurrences="7" value="ng_di" /> + <ngram occurrences="7" value="na_" /> + <ngram occurrences="7" value="n_da" /> + <ngram occurrences="7" value="mer" /> + <ngram occurrences="7" value="man" /> + <ngram occurrences="7" value="kepad" /> + <ngram occurrences="7" value="kepa" /> +</ngrams> diff --git a/src/plugins/language/manx.klp b/src/plugins/language/manx.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="965" value="_" /> + <ngram occurrences="490" value="e" /> + <ngram occurrences="428" value="a" /> + <ngram occurrences="344" value="y" /> + <ngram occurrences="315" value="n" /> + <ngram occurrences="308" value="h" /> + <ngram occurrences="289" value="r" /> + <ngram occurrences="265" value="o" /> + <ngram occurrences="250" value="s" /> + <ngram occurrences="210" value="i" /> + <ngram occurrences="176" value="l" /> + <ngram occurrences="166" value="y_" /> + <ngram occurrences="162" value="g" /> + <ngram occurrences="153" value="n_" /> + <ngram occurrences="137" value="t" /> + <ngram occurrences="128" value="d" /> + <ngram occurrences="105" value="_a" /> + <ngram occurrences="104" value="h_" /> + <ngram occurrences="100" value="m" /> + <ngram occurrences="93" value="sh" /> + <ngram occurrences="93" value="e_" /> + <ngram occurrences="93" value="c" /> + <ngram occurrences="90" value="_s" /> + <ngram occurrences="89" value="ee" /> + <ngram occurrences="85" value="_e" /> + <ngram occurrences="83" value="yn" /> + <ngram occurrences="82" value="gh" /> + <ngram occurrences="79" value="ag" /> + <ngram occurrences="78" value="r_" /> + <ngram occurrences="75" value="s_" /> + <ngram occurrences="74" value="oo" /> + <ngram occurrences="72" value="ey" /> + <ngram occurrences="71" value="agh" /> + <ngram occurrences="69" value="ey_" /> + <ngram occurrences="68" value="yn_" /> + <ngram occurrences="67" value="a_" /> + <ngram occurrences="67" value="_d" /> + <ngram occurrences="65" value="_c" /> + <ngram occurrences="58" value="_n" /> + <ngram occurrences="57" value="v" /> + <ngram occurrences="57" value="as" /> + <ngram occurrences="56" value="u" /> + <ngram occurrences="56" value="_m" /> + <ngram occurrences="55" value="t_" /> + <ngram occurrences="54" value="he" /> + <ngram occurrences="54" value="_v" /> + <ngram occurrences="50" value="in" /> + <ngram occurrences="49" value="ch" /> + <ngram occurrences="49" value="_y" /> + <ngram occurrences="49" value="_r" /> + <ngram occurrences="48" value="ee_" /> + <ngram occurrences="48" value="_as" /> + <ngram occurrences="47" value="oi" /> + <ngram occurrences="47" value="gh_" /> + <ngram occurrences="47" value="er" /> + <ngram occurrences="47" value="_sh" /> + <ngram occurrences="46" value="agh_" /> + <ngram occurrences="46" value="_t" /> + <ngram occurrences="44" value="ar" /> + <ngram occurrences="43" value="_ch" /> + <ngram occurrences="41" value="yr" /> + <ngram occurrences="38" value="re" /> + <ngram occurrences="38" value="ll" /> + <ngram occurrences="38" value="b" /> + <ngram occurrences="38" value="as_" /> + <ngram occurrences="38" value="_as_" /> + <ngram occurrences="37" value="ny" /> + <ngram occurrences="37" value="dy" /> + <ngram occurrences="37" value="_g" /> + <ngram occurrences="36" value="le" /> + <ngram occurrences="36" value="k" /> + <ngram occurrences="36" value="hi" /> + <ngram occurrences="36" value="ay" /> + <ngram occurrences="35" value="ha" /> + <ngram occurrences="34" value="er_" /> + <ngram occurrences="34" value="en" /> + <ngram occurrences="34" value="_l" /> + <ngram occurrences="33" value="ra" /> + <ngram occurrences="33" value="nn" /> + <ngram occurrences="33" value="f" /> + <ngram occurrences="33" value="_f" /> + <ngram occurrences="32" value="ne" /> + <ngram occurrences="32" value="is" /> + <ngram occurrences="32" value="ea" /> + <ngram occurrences="31" value="in_" /> + <ngram occurrences="31" value="an" /> + <ngram occurrences="31" value="_b" /> + <ngram occurrences="30" value="ro" /> + <ngram occurrences="30" value="oa" /> + <ngram occurrences="30" value="l_" /> + <ngram occurrences="30" value="ish" /> + <ngram occurrences="30" value="d_" /> + <ngram occurrences="30" value="_h" /> + <ngram occurrences="29" value="rr" /> + <ngram occurrences="28" value="_er" /> + <ngram occurrences="28" value="_dy" /> + <ngram occurrences="27" value="la" /> + <ngram occurrences="27" value="ht" /> + <ngram occurrences="27" value="dy_" /> + <ngram occurrences="27" value="_dy_" /> + <ngram occurrences="26" value="sh_" /> + <ngram occurrences="26" value="rt" /> + <ngram occurrences="25" value="j" /> + <ngram occurrences="25" value="ei" /> + <ngram occurrences="25" value="_ny" /> + <ngram occurrences="25" value="_er_" /> + <ngram occurrences="24" value="ny_" /> + <ngram occurrences="24" value="aa" /> + <ngram occurrences="24" value="_y_" /> + <ngram occurrences="24" value="_ny_" /> + <ngram occurrences="23" value="y_c" /> + <ngram occurrences="23" value="ooi" /> + <ngram occurrences="23" value="n_a" /> + <ngram occurrences="23" value="me" /> + <ngram occurrences="23" value="ish_" /> + <ngram occurrences="23" value="ho" /> + <ngram occurrences="22" value="o_" /> + <ngram occurrences="22" value="my" /> + <ngram occurrences="22" value="ie" /> + <ngram occurrences="22" value="_o" /> + <ngram occurrences="22" value="_j" /> + <ngram occurrences="21" value="rt_" /> + <ngram occurrences="21" value="mee_" /> + <ngram occurrences="21" value="mee" /> + <ngram occurrences="21" value="al" /> + <ngram occurrences="20" value="tr" /> + <ngram occurrences="20" value="shi" /> + <ngram occurrences="20" value="ri" /> + <ngram occurrences="20" value="m_" /> + <ngram occurrences="20" value="ia" /> + <ngram occurrences="20" value="el" /> + <ngram occurrences="19" value="y_ch" /> + <ngram occurrences="19" value="va" /> + <ngram occurrences="19" value="il" /> + <ngram occurrences="19" value="eh_" /> + <ngram occurrences="19" value="eh" /> + <ngram occurrences="19" value="_va" /> + <ngram occurrences="19" value="_tr" /> + <ngram occurrences="19" value="_mee_" /> + <ngram occurrences="19" value="_mee" /> + <ngram occurrences="19" value="_me" /> + <ngram occurrences="18" value="ta" /> + <ngram occurrences="18" value="she" /> + <ngram occurrences="18" value="p" /> + <ngram occurrences="18" value="lle" /> + <ngram occurrences="18" value="g_" /> + <ngram occurrences="18" value="do" /> + <ngram occurrences="18" value="_shi" /> + <ngram occurrences="18" value="_n_" /> + <ngram occurrences="18" value="_my" /> + <ngram occurrences="18" value="_do" /> + <ngram occurrences="18" value="_ay" /> + <ngram occurrences="17" value="ys" /> + <ngram occurrences="17" value="yr_" /> + <ngram occurrences="17" value="w" /> + <ngram occurrences="17" value="ty" /> + <ngram occurrences="17" value="on" /> + <ngram occurrences="17" value="n_s" /> + <ngram occurrences="17" value="en_" /> + <ngram occurrences="17" value="ayn" /> + <ngram occurrences="17" value="a_n" /> + <ngram occurrences="17" value="_ro" /> + <ngram occurrences="16" value="oo_" /> + <ngram occurrences="16" value="ley_" /> + <ngram occurrences="16" value="ley" /> + <ngram occurrences="16" value="ie_" /> + <ngram occurrences="16" value="che" /> + <ngram occurrences="16" value="ar_" /> + <ngram occurrences="16" value="_she" /> + <ngram occurrences="15" value="ym" /> + <ngram occurrences="15" value="ss" /> + <ngram occurrences="15" value="or" /> + <ngram occurrences="15" value="oar" /> + <ngram occurrences="15" value="ns" /> + <ngram occurrences="15" value="ni" /> + <ngram occurrences="15" value="ill" /> + <ngram occurrences="15" value="ht_" /> + <ngram occurrences="15" value="hen" /> + <ngram occurrences="15" value="h_a" /> + <ngram occurrences="15" value="ght" /> + <ngram occurrences="15" value="cha" /> + <ngram occurrences="15" value="_yn" /> + <ngram occurrences="15" value="_cha" /> + <ngram occurrences="15" value="_ayn" /> + <ngram occurrences="15" value="_ag" /> + <ngram occurrences="14" value="vo" /> + <ngram occurrences="14" value="ur" /> + <ngram occurrences="14" value="te" /> + <ngram occurrences="14" value="ree" /> + <ngram occurrences="14" value="oy" /> + <ngram occurrences="14" value="ooa" /> + <ngram occurrences="14" value="n_d" /> + <ngram occurrences="14" value="hey_" /> + <ngram occurrences="14" value="hey" /> + <ngram occurrences="14" value="es" /> + <ngram occurrences="14" value="doo" /> + <ngram occurrences="14" value="da" /> + <ngram occurrences="14" value="ayr" /> + <ngram occurrences="14" value="_yn_" /> + <ngram occurrences="14" value="_ta" /> + <ngram occurrences="14" value="_doo" /> + <ngram occurrences="14" value="_da" /> + <ngram occurrences="14" value="_agh" /> + <ngram occurrences="13" value="ys_" /> + <ngram occurrences="13" value="yrt" /> + <ngram occurrences="13" value="ym_" /> + <ngram occurrences="13" value="y_v" /> + <ngram occurrences="13" value="w_" /> + <ngram occurrences="13" value="ve" /> + <ngram occurrences="13" value="va_" /> + <ngram occurrences="13" value="tyn_" /> + <ngram occurrences="13" value="tyn" /> + <ngram occurrences="13" value="so" /> + <ngram occurrences="13" value="ooy" /> + <ngram occurrences="13" value="ooar" /> + <ngram occurrences="13" value="oil" /> + <ngram occurrences="13" value="na" /> + <ngram occurrences="13" value="mo" /> + <ngram occurrences="13" value="lley_" /> + <ngram occurrences="13" value="lley" /> + <ngram occurrences="13" value="gg" /> + <ngram occurrences="13" value="ck" /> + <ngram occurrences="13" value="aght" /> + <ngram occurrences="13" value="ae" /> + <ngram occurrences="13" value="_vo" /> + <ngram occurrences="13" value="_ve" /> + <ngram occurrences="13" value="_va_" /> + <ngram occurrences="13" value="_k" /> + <ngram occurrences="13" value="_eh_" /> + <ngram occurrences="13" value="_eh" /> + <ngram occurrences="12" value="yns" /> + <ngram occurrences="12" value="y_s" /> + <ngram occurrences="12" value="y_a" /> + <ngram occurrences="12" value="sht" /> + <ngram occurrences="12" value="s_y" /> + <ngram occurrences="12" value="ry" /> + <ngram occurrences="12" value="row_" /> + <ngram occurrences="12" value="row" /> + <ngram occurrences="12" value="ow_" /> + <ngram occurrences="12" value="ow" /> + <ngram occurrences="12" value="nni" /> + <ngram occurrences="12" value="ne_" /> + <ngram occurrences="12" value="nagh" /> + <ngram occurrences="12" value="nag" /> + <ngram occurrences="12" value="k_" /> + <ngram occurrences="12" value="je" /> + <ngram occurrences="12" value="hu" /> + <ngram occurrences="12" value="ha_" /> + <ngram occurrences="12" value="h_n" /> + <ngram occurrences="12" value="h_e" /> + <ngram occurrences="12" value="gh_a" /> + <ngram occurrences="12" value="e_s" /> + <ngram occurrences="12" value="e_e" /> + <ngram occurrences="12" value="cha_" /> + <ngram occurrences="12" value="agh_a" /> + <ngram occurrences="12" value="ad" /> + <ngram occurrences="12" value="_row_" /> + <ngram occurrences="12" value="_row" /> + <ngram occurrences="12" value="_je" /> + <ngram occurrences="12" value="_che" /> + <ngram occurrences="12" value="_cha_" /> + <ngram occurrences="11" value="y_r" /> + <ngram occurrences="11" value="y_m" /> + <ngram occurrences="11" value="u_" /> + <ngram occurrences="11" value="tra" /> + <ngram occurrences="11" value="ta_" /> + <ngram occurrences="11" value="t_a" /> + <ngram occurrences="11" value="shin" /> + <ngram occurrences="11" value="ra_" /> + <ngram occurrences="11" value="r_y" /> + <ngram occurrences="11" value="oin" /> + <ngram occurrences="11" value="ney" /> + <ngram occurrences="11" value="n_t" /> + <ngram occurrences="11" value="ma" /> + <ngram occurrences="11" value="ille" /> + <ngram occurrences="11" value="hin" /> + <ngram occurrences="11" value="hee" /> + <ngram occurrences="11" value="h_d" /> + <ngram occurrences="11" value="eea" /> + <ngram occurrences="11" value="ed" /> + <ngram occurrences="11" value="eay" /> + <ngram occurrences="11" value="ayns" /> + <ngram occurrences="11" value="at" /> + <ngram occurrences="11" value="arr" /> + <ngram occurrences="11" value="aa_" /> + <ngram occurrences="11" value="_tra" /> + <ngram occurrences="11" value="_ta_" /> + <ngram occurrences="11" value="_so" /> + <ngram occurrences="11" value="_ma" /> + <ngram occurrences="11" value="_la" /> + <ngram occurrences="11" value="_ayns" /> + <ngram occurrences="11" value="_agh_" /> + <ngram occurrences="10" value="yrt_" /> + <ngram occurrences="10" value="yns_" /> + <ngram occurrences="10" value="yn_a" /> + <ngram occurrences="10" value="y_g" /> + <ngram occurrences="10" value="sy" /> + <ngram occurrences="10" value="ss_" /> + <ngram occurrences="10" value="shin_" /> + <ngram occurrences="10" value="shen" /> + <ngram occurrences="10" value="rey_" /> + <ngram occurrences="10" value="rey" /> + <ngram occurrences="10" value="ooar_" /> + <ngram occurrences="10" value="ois" /> + <ngram occurrences="10" value="oill" /> + <ngram occurrences="10" value="oar_" /> + <ngram occurrences="10" value="ns_" /> + <ngram occurrences="10" value="ney_" /> + <ngram occurrences="10" value="nagh_" /> + <ngram occurrences="10" value="n_m" /> + <ngram occurrences="10" value="n_c" /> + <ngram occurrences="10" value="n_as" /> + <ngram occurrences="10" value="myr_" /> + <ngram occurrences="10" value="myr" /> + <ngram occurrences="10" value="moo" /> + <ngram occurrences="10" value="io" /> + <ngram occurrences="10" value="id" /> + <ngram occurrences="10" value="hoo" /> + <ngram occurrences="10" value="hin_" /> + <ngram occurrences="10" value="h_as" /> + <ngram occurrences="10" value="ge" /> + <ngram occurrences="10" value="fo" /> + <ngram occurrences="10" value="fe" /> + <ngram occurrences="10" value="e_a" /> + <ngram occurrences="10" value="ayns_" /> + <ngram occurrences="10" value="ass" /> + <ngram occurrences="10" value="ann" /> + <ngram occurrences="10" value="ai" /> + <ngram occurrences="10" value="_shin" /> + <ngram occurrences="10" value="_shen" /> + <ngram occurrences="10" value="_oo" /> + <ngram occurrences="10" value="_fo" /> + <ngram occurrences="10" value="_fe" /> + <ngram occurrences="9" value="yl" /> + <ngram occurrences="9" value="y_l" /> + <ngram occurrences="9" value="y_j" /> + <ngram occurrences="9" value="y_h" /> + <ngram occurrences="9" value="v_e" /> + <ngram occurrences="9" value="v_" /> + <ngram occurrences="9" value="tey_" /> + <ngram occurrences="9" value="tey" /> + <ngram occurrences="9" value="st" /> + <ngram occurrences="9" value="sho" /> + <ngram occurrences="9" value="shen_" /> + <ngram occurrences="9" value="s_s" /> + <ngram occurrences="9" value="roo" /> + <ngram occurrences="9" value="rish" /> + <ngram occurrences="9" value="ris" /> + <ngram occurrences="9" value="ooin" /> + <ngram occurrences="9" value="oish_" /> + <ngram occurrences="9" value="oish" /> + <ngram occurrences="9" value="li" /> + <ngram occurrences="9" value="lh" /> + <ngram occurrences="9" value="lag" /> + <ngram occurrences="9" value="ki" /> + <ngram occurrences="9" value="illey" /> + <ngram occurrences="9" value="ick" /> + <ngram occurrences="9" value="ic" /> + <ngram occurrences="9" value="hur" /> + <ngram occurrences="9" value="hen_" /> + <ngram occurrences="9" value="gh_as" /> + <ngram occurrences="9" value="ey_m" /> + <ngram occurrences="9" value="enn" /> + <ngram occurrences="9" value="eg" /> + <ngram occurrences="9" value="eer" /> + <ngram occurrences="9" value="dd" /> + <ngram occurrences="9" value="ass_" /> + <ngram occurrences="9" value="al_" /> + <ngram occurrences="9" value="_v_e" /> + <ngram occurrences="9" value="_v_" /> + <ngram occurrences="9" value="_myr_" /> + <ngram occurrences="9" value="_myr" /> + <ngram occurrences="9" value="_lh" /> + <ngram occurrences="9" value="_ad" /> + <ngram occurrences="8" value="yn_m" /> + <ngram occurrences="8" value="y_t" /> + <ngram occurrences="8" value="y_as" /> + <ngram occurrences="8" value="voish" /> + <ngram occurrences="8" value="vois" /> + <ngram occurrences="8" value="voi" /> + <ngram occurrences="8" value="t_m" /> + <ngram occurrences="8" value="sht_" /> + <ngram occurrences="8" value="se" /> + <ngram occurrences="8" value="s_d" /> + <ngram occurrences="8" value="rish_" /> + <ngram occurrences="8" value="ree_" /> + <ngram occurrences="8" value="rag" /> + <ngram occurrences="8" value="oille" /> + <ngram occurrences="8" value="oie_" /> + <ngram occurrences="8" value="oie" /> + <ngram occurrences="8" value="od" /> + <ngram occurrences="8" value="nyn_" /> + <ngram occurrences="8" value="nyn" /> + <ngram occurrences="8" value="n_v" /> + <ngram occurrences="8" value="n_sh" /> + <ngram occurrences="8" value="n_g" /> + <ngram occurrences="8" value="n_e" /> + <ngram occurrences="8" value="n_dy_" /> + <ngram occurrences="8" value="n_dy" /> + <ngram occurrences="8" value="n_as_" /> +</ngrams> diff --git a/src/plugins/language/marathi.klp b/src/plugins/language/marathi.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1569" value="þ" /> + <ngram occurrences="1426" value="_" /> + <ngram occurrences="995" value="_þ" /> + <ngram occurrences="895" value="þ_" /> + <ngram occurrences="629" value="þ_þ" /> + <ngram occurrences="464" value="_þ_" /> + <ngram occurrences="367" value="þþ" /> + <ngram occurrences="328" value="_þþ" /> + <ngram occurrences="326" value="_þ_þ" /> + <ngram occurrences="314" value="þþ_" /> + <ngram occurrences="280" value="_þþ_" /> + <ngram occurrences="279" value="þ_þ_" /> + <ngram occurrences="228" value="þþ_þ" /> + <ngram occurrences="217" value="þ_þþ" /> + <ngram occurrences="201" value="_þþ_þ" /> + <ngram occurrences="198" value="þ_þ_þ" /> + <ngram occurrences="183" value="þ_þþ_" /> + <ngram occurrences="142" value="_þ_þ_" /> + <ngram occurrences="139" value="ú" /> + <ngram occurrences="129" value="ú_" /> + <ngram occurrences="125" value="ø" /> + <ngram occurrences="113" value="¨" /> + <ngram occurrences="113" value="_þ_þþ" /> + <ngram occurrences="110" value="ø_" /> + <ngram occurrences="106" value="å" /> + <ngram occurrences="100" value="þþ_þ_" /> + <ngram occurrences="98" value="¨þ" /> + <ngram occurrences="87" value="ú_þ" /> + <ngram occurrences="86" value="¹" /> + <ngram occurrences="85" value="_å" /> + <ngram occurrences="83" value="þþ_þþ" /> + <ngram occurrences="83" value="þú" /> + <ngram occurrences="76" value="þú_" /> + <ngram occurrences="72" value="ø_þ" /> + <ngram occurrences="67" value="_ø" /> + <ngram occurrences="66" value="_þú" /> + <ngram occurrences="63" value="_ø_" /> + <ngram occurrences="62" value="_þú_" /> + <ngram occurrences="54" value="¨þ_" /> + <ngram occurrences="52" value="_¹" /> + <ngram occurrences="50" value="½" /> + <ngram occurrences="49" value="þ_þú" /> + <ngram occurrences="49" value="å_" /> + <ngram occurrences="49" value="µ" /> + <ngram occurrences="48" value="þú_þ" /> + <ngram occurrences="47" value="þ¨" /> + <ngram occurrences="47" value="þ_þú_" /> + <ngram occurrences="47" value="¹_" /> + <ngram occurrences="45" value="þ_ø" /> + <ngram occurrences="45" value="þ_å" /> + <ngram occurrences="44" value="þ_ø_" /> + <ngram occurrences="44" value="_ø_þ" /> + <ngram occurrences="42" value="þø" /> + <ngram occurrences="41" value="þ¨þ" /> + <ngram occurrences="41" value="ú_þ_" /> + <ngram occurrences="41" value="µþ" /> + <ngram occurrences="40" value="û" /> + <ngram occurrences="40" value="¹_þ" /> + <ngram occurrences="40" value="_ú" /> + <ngram occurrences="39" value="½_" /> + <ngram occurrences="39" value="_ú_" /> + <ngram occurrences="38" value="_½" /> + <ngram occurrences="38" value="_þø" /> + <ngram occurrences="38" value="_å_" /> + <ngram occurrences="37" value="¸" /> + <ngram occurrences="37" value="_þú_þ" /> + <ngram occurrences="36" value="¨þ_þ" /> + <ngram occurrences="36" value="_¨" /> + <ngram occurrences="35" value="þø_" /> + <ngram occurrences="35" value="å_þ" /> + <ngram occurrences="33" value="þ_ú" /> + <ngram occurrences="32" value="þ_ú_" /> + <ngram occurrences="32" value="þ_ø_þ" /> + <ngram occurrences="32" value="ø_þ_" /> + <ngram occurrences="31" value="_þø_" /> + <ngram occurrences="30" value="þ¹" /> + <ngram occurrences="30" value="_½_" /> + <ngram occurrences="29" value="þµ" /> + <ngram occurrences="29" value="þ_¹" /> + <ngram occurrences="29" value="¹_þ_" /> + <ngram occurrences="29" value="_þ¨" /> + <ngram occurrences="28" value="þ_þø" /> + <ngram occurrences="28" value="ú_þþ" /> + <ngram occurrences="28" value="_¨þ" /> + <ngram occurrences="28" value="_þ_å" /> + <ngram occurrences="28" value="_å_þ" /> + <ngram occurrences="27" value="ú_þ_þ" /> + <ngram occurrences="27" value="åþ" /> + <ngram occurrences="27" value="_ú_þ" /> + <ngram occurrences="27" value="_¹_" /> + <ngram occurrences="26" value="þ_½" /> + <ngram occurrences="26" value="ú_þþ_" /> + <ngram occurrences="26" value="é" /> + <ngram occurrences="26" value="_åþ" /> + <ngram occurrences="25" value="ù" /> + <ngram occurrences="25" value="_é" /> + <ngram occurrences="24" value="þ¨þ_" /> + <ngram occurrences="24" value="þ_þø_" /> + <ngram occurrences="24" value="é_" /> + <ngram occurrences="24" value="åþ_" /> + <ngram occurrences="24" value="ä" /> + <ngram occurrences="24" value="¹_þ_þ" /> + <ngram occurrences="24" value="µþ_" /> + <ngram occurrences="24" value="_þ_þú" /> + <ngram occurrences="24" value="_þ_ø_" /> + <ngram occurrences="24" value="_þ_ø" /> + <ngram occurrences="24" value="_¹_þ" /> + <ngram occurrences="23" value="½_þ" /> + <ngram occurrences="23" value="þ_¨" /> + <ngram occurrences="23" value="þ_½_" /> + <ngram occurrences="23" value="þ_ú_þ" /> + <ngram occurrences="23" value="ø_þ_þ" /> + <ngram occurrences="23" value="_þ¨þ" /> + <ngram occurrences="23" value="_é_" /> + <ngram occurrences="23" value="_åþ_" /> + <ngram occurrences="22" value="ø_þþ" /> + <ngram occurrences="22" value="ä_" /> + <ngram occurrences="22" value="_þ_½" /> + <ngram occurrences="21" value="¸_" /> + <ngram occurrences="21" value="þú_þ_" /> + <ngram occurrences="21" value="þø_þ" /> + <ngram occurrences="21" value="þµþ" /> + <ngram occurrences="20" value="¨þþ" /> + <ngram occurrences="20" value="þ¹_" /> + <ngram occurrences="20" value="þ_å_" /> + <ngram occurrences="20" value="ø_þþ_" /> + <ngram occurrences="20" value="_þ_½_" /> + <ngram occurrences="20" value="_ø_þ_" /> + <ngram occurrences="20" value="_¹_þ_" /> + <ngram occurrences="19" value="þú_þþ" /> + <ngram occurrences="19" value="_½_þ" /> + <ngram occurrences="18" value="þþ_þú" /> + <ngram occurrences="18" value="þ_¨þ" /> + <ngram occurrences="18" value="þ_þ¨" /> + <ngram occurrences="18" value="þ_þ_å" /> + <ngram occurrences="18" value="å_þ_" /> + <ngram occurrences="18" value="ª" /> + <ngram occurrences="18" value="_þø_þ" /> + <ngram occurrences="18" value="_þ¹" /> + <ngram occurrences="17" value="¨þ_þ_" /> + <ngram occurrences="17" value="åþ_þ" /> + <ngram occurrences="17" value="_þµ" /> + <ngram occurrences="17" value="_þ_þø" /> + <ngram occurrences="16" value="¨þþ_" /> + <ngram occurrences="16" value="þä" /> + <ngram occurrences="16" value="þ¹_þ" /> + <ngram occurrences="16" value="þ_é" /> + <ngram occurrences="16" value="ù_" /> + <ngram occurrences="16" value="ªþ" /> + <ngram occurrences="16" value="_¸" /> + <ngram occurrences="16" value="_þ_¹" /> + <ngram occurrences="16" value="_ø_þþ" /> + <ngram occurrences="16" value="_åþ_þ" /> + <ngram occurrences="15" value="þä_" /> + <ngram occurrences="15" value="þ_½_þ" /> + <ngram occurrences="15" value="þ_þ_ø" /> + <ngram occurrences="15" value="þ_å_þ" /> + <ngram occurrences="15" value="å_þ_þ" /> + <ngram occurrences="14" value="þ¨þ_þ" /> + <ngram occurrences="14" value="þþ_ú_" /> + <ngram occurrences="14" value="þþ_ú" /> + <ngram occurrences="14" value="þû" /> + <ngram occurrences="14" value="þ_þ¨þ" /> + <ngram occurrences="14" value="þ_þ_½" /> + <ngram occurrences="14" value="þ_é_" /> + <ngram occurrences="14" value="û_" /> + <ngram occurrences="14" value="ø_å" /> + <ngram occurrences="14" value="ê" /> + <ngram occurrences="14" value="¹¨þ" /> + <ngram occurrences="14" value="¹¨" /> + <ngram occurrences="14" value="_þ_å_" /> + <ngram occurrences="13" value="þþ¨þ" /> + <ngram occurrences="13" value="þþ¨" /> + <ngram occurrences="13" value="þþ_ø" /> + <ngram occurrences="13" value="þ_åþ" /> + <ngram occurrences="13" value="ê_þ" /> + <ngram occurrences="13" value="ê_" /> + <ngram occurrences="13" value="ä_þ" /> + <ngram occurrences="13" value="_þþ_ú" /> + <ngram occurrences="13" value="_þµþ" /> + <ngram occurrences="13" value="_ê" /> + <ngram occurrences="13" value="_å_þ_" /> + <ngram occurrences="12" value="þþ_ø_" /> + <ngram occurrences="12" value="þþ_å" /> + <ngram occurrences="12" value="þ_¸" /> + <ngram occurrences="12" value="þ_åþ_" /> + <ngram occurrences="12" value="é_þ" /> + <ngram occurrences="12" value="å_þþ" /> + <ngram occurrences="12" value="µþ_þ" /> + <ngram occurrences="12" value="_þ¨þ_" /> + <ngram occurrences="12" value="_þþ¨þ" /> + <ngram occurrences="12" value="_þþ¨" /> + <ngram occurrences="12" value="_þþ_ø" /> + <ngram occurrences="12" value="_û" /> + <ngram occurrences="12" value="_ú_þ_" /> + <ngram occurrences="12" value="_ê_þ" /> + <ngram occurrences="12" value="_ê_" /> + <ngram occurrences="12" value="_é_þ" /> + <ngram occurrences="11" value="¨þþ_þ" /> + <ngram occurrences="11" value="½_þ_" /> + <ngram occurrences="11" value="þû_" /> + <ngram occurrences="11" value="þ_¹_þ" /> + <ngram occurrences="11" value="þ_¹_" /> + <ngram occurrences="11" value="ù_þ" /> + <ngram occurrences="11" value="åþ_þ_" /> + <ngram occurrences="11" value="_¨þ_" /> + <ngram occurrences="10" value="¸_þ" /> + <ngram occurrences="10" value="þþ_¨" /> + <ngram occurrences="10" value="þþ_¹" /> + <ngram occurrences="10" value="þµþ_" /> + <ngram occurrences="10" value="þ_þµ" /> + <ngram occurrences="10" value="þ_ê" /> + <ngram occurrences="10" value="û_þ" /> + <ngram occurrences="10" value="ú_¹" /> + <ngram occurrences="10" value="å_þþ_" /> + <ngram occurrences="10" value="¹¸" /> + <ngram occurrences="10" value="¹¨þ_" /> + <ngram occurrences="10" value="_¨þþ" /> + <ngram occurrences="10" value="_þþ_¨" /> + <ngram occurrences="10" value="_þû" /> + <ngram occurrences="10" value="_þ_åþ" /> + <ngram occurrences="10" value="_ù" /> + <ngram occurrences="10" value="_å_þþ" /> + <ngram occurrences="10" value="_¹¸" /> + <ngram occurrences="10" value="_¹¨þ" /> + <ngram occurrences="10" value="_¹¨" /> + <ngram occurrences="9" value="¨_" /> + <ngram occurrences="9" value="þ¸" /> + <ngram occurrences="9" value="þþ¨þ_" /> + <ngram occurrences="9" value="þþ¹_" /> + <ngram occurrences="9" value="þþ¹" /> + <ngram occurrences="9" value="þû_þ" /> + <ngram occurrences="9" value="þ¹µþ_" /> + <ngram occurrences="9" value="þ¹µþ" /> + <ngram occurrences="9" value="þ¹µ" /> + <ngram occurrences="9" value="þ¹_þ_" /> + <ngram occurrences="9" value="þ_¨þ_" /> + <ngram occurrences="9" value="þ_þ_¹" /> + <ngram occurrences="9" value="þ_ê_þ" /> + <ngram occurrences="9" value="þ_ê_" /> + <ngram occurrences="9" value="ú_å" /> + <ngram occurrences="9" value="ê_þ_" /> + <ngram occurrences="9" value="¹µþ_" /> + <ngram occurrences="9" value="¹µþ" /> + <ngram occurrences="9" value="¹µ" /> + <ngram occurrences="9" value="µþþ_" /> + <ngram occurrences="9" value="µþþ" /> + <ngram occurrences="9" value="_½_þ_" /> + <ngram occurrences="9" value="_þþ¹_" /> + <ngram occurrences="9" value="_þþ¹" /> + <ngram occurrences="9" value="_þþ_å" /> + <ngram occurrences="9" value="_þþ_¹" /> + <ngram occurrences="9" value="_þ¹µþ" /> + <ngram occurrences="9" value="_þ¹µ" /> + <ngram occurrences="9" value="_þ_þ¨" /> + <ngram occurrences="9" value="_þ_ú" /> + <ngram occurrences="8" value="¨þ_þþ" /> + <ngram occurrences="8" value="¨_þ" /> + <ngram occurrences="8" value="½å" /> + <ngram occurrences="8" value="½_þ_þ" /> + <ngram occurrences="8" value="þþ¹_þ" /> + <ngram occurrences="8" value="þþ_þø" /> + <ngram occurrences="8" value="þú_¹" /> + <ngram occurrences="8" value="þø_þ_" /> + <ngram occurrences="8" value="þä_þ" /> + <ngram occurrences="8" value="þ_þþ¨" /> + <ngram occurrences="8" value="þ_þ¹" /> + <ngram occurrences="8" value="þ_¹¨þ" /> + <ngram occurrences="8" value="þ_¹¨" /> + <ngram occurrences="8" value="ä_þ_" /> + <ngram occurrences="8" value="º" /> + <ngram occurrences="8" value="¹¨þ_þ" /> + <ngram occurrences="8" value="µþ_þþ" /> + <ngram occurrences="8" value="_¸_" /> + <ngram occurrences="8" value="_½å" /> + <ngram occurrences="8" value="_þ¹_" /> + <ngram occurrences="8" value="_þµþ_" /> + <ngram occurrences="8" value="_þ_¸" /> + <ngram occurrences="8" value="_þ_¨" /> + <ngram occurrences="8" value="_þ_ú_" /> + <ngram occurrences="8" value="_ê_þ_" /> + <ngram occurrences="7" value="½_þþ_" /> + <ngram occurrences="7" value="½_þþ" /> + <ngram occurrences="7" value="þþ_¨þ" /> + <ngram occurrences="7" value="þþ_þ¨" /> + <ngram occurrences="7" value="þ_¸_" /> + <ngram occurrences="7" value="þ_þµþ" /> + <ngram occurrences="7" value="ûå" /> + <ngram occurrences="7" value="ú_¹_" /> + <ngram occurrences="7" value="ù_þþ" /> + <ngram occurrences="7" value="ï" /> + <ngram occurrences="7" value="µþþ_þ" /> + <ngram occurrences="7" value="ªþ_" /> + <ngram occurrences="7" value="_¨þþ_" /> + <ngram occurrences="7" value="_¨þ_þ" /> + <ngram occurrences="7" value="_þû_" /> + <ngram occurrences="7" value="_þ_¨þ" /> + <ngram occurrences="7" value="_ú_þþ" /> + <ngram occurrences="6" value="¸_þ_" /> + <ngram occurrences="6" value="¨þ_þú" /> + <ngram occurrences="6" value="½å_" /> + <ngram occurrences="6" value="þ¸_" /> + <ngram occurrences="6" value="þ¨þþ" /> + <ngram occurrences="6" value="þ¨_" /> + <ngram occurrences="6" value="þþ¸_" /> + <ngram occurrences="6" value="þþ¸" /> + <ngram occurrences="6" value="þþä" /> + <ngram occurrences="6" value="þþ_ê_" /> + <ngram occurrences="6" value="þþ_ê" /> + <ngram occurrences="6" value="þþ_é_" /> + <ngram occurrences="6" value="þþ_é" /> + <ngram occurrences="6" value="þú_¹_" /> + <ngram occurrences="6" value="þù" /> + <ngram occurrences="6" value="þø_å" /> + <ngram occurrences="6" value="þµþ_þ" /> + <ngram occurrences="6" value="þ_¨þþ" /> + <ngram occurrences="6" value="þ_þû" /> + <ngram occurrences="6" value="þ_û" /> + <ngram occurrences="6" value="þ_é_þ" /> + <ngram occurrences="6" value="þ_¹¸" /> + <ngram occurrences="6" value="ú_¨" /> + <ngram occurrences="6" value="ú_¹_þ" /> + <ngram occurrences="6" value="ø_åþ" /> + <ngram occurrences="6" value="ø_å_" /> + <ngram occurrences="6" value="ø_¹_" /> + <ngram occurrences="6" value="ø_¹" /> + <ngram occurrences="6" value="ï_þ" /> + <ngram occurrences="6" value="ï_" /> + <ngram occurrences="6" value="é_þ_" /> + <ngram occurrences="6" value="åþ_ú_" /> + <ngram occurrences="6" value="åþ_ú" /> + <ngram occurrences="6" value="åû" /> + <ngram occurrences="6" value="åú_þ" /> + <ngram occurrences="6" value="åú_" /> + <ngram occurrences="6" value="åú" /> + <ngram occurrences="6" value="ä_þ_þ" /> + <ngram occurrences="6" value="¹¸_" /> + <ngram occurrences="6" value="_½å_" /> + <ngram occurrences="6" value="_½_þþ" /> + <ngram occurrences="6" value="_þ¨_" /> + <ngram occurrences="6" value="_þþä" /> + <ngram occurrences="6" value="_þþ_ê" /> + <ngram occurrences="6" value="_þþ_é" /> + <ngram occurrences="6" value="_þú_¹" /> + <ngram occurrences="6" value="_þ¹_þ" /> + <ngram occurrences="6" value="_þ_é_" /> + <ngram occurrences="6" value="_þ_é" /> + <ngram occurrences="6" value="_ï" /> + <ngram occurrences="6" value="_é_þ_" /> + <ngram occurrences="6" value="_åþ_ú" /> + <ngram occurrences="6" value="_¹¸_" /> + <ngram occurrences="6" value="_¹¨þ_" /> + <ngram occurrences="6" value="_ªþ" /> + <ngram occurrences="6" value="_ª" /> + <ngram occurrences="5" value="¸þ" /> + <ngram occurrences="5" value="¨þú" /> + <ngram occurrences="5" value="¨þµ" /> + <ngram occurrences="5" value="¨_þþ_" /> + <ngram occurrences="5" value="¨_þþ" /> + <ngram occurrences="5" value="þ¨þþ_" /> + <ngram occurrences="5" value="þ¨_þ" /> + <ngram occurrences="5" value="þþù_" /> + <ngram occurrences="5" value="þþù" /> + <ngram occurrences="5" value="þþä_" /> + <ngram occurrences="5" value="þþµ" /> + <ngram occurrences="5" value="þù_" /> + <ngram occurrences="5" value="þµþú_" /> + <ngram occurrences="5" value="þµþú" /> + <ngram occurrences="5" value="þµø" /> + <ngram occurrences="5" value="þ_þþä" /> + <ngram occurrences="5" value="þ_þþ¹" /> + <ngram occurrences="5" value="þ_þû_" /> + <ngram occurrences="5" value="þ_þ_¨" /> + <ngram occurrences="5" value="þ_ù" /> + <ngram occurrences="5" value="þ_ªþ" /> + <ngram occurrences="5" value="þ_ª" /> + <ngram occurrences="5" value="û½_" /> + <ngram occurrences="5" value="û½" /> + <ngram occurrences="5" value="ûþ" /> + <ngram occurrences="5" value="ú_¨þ" /> + <ngram occurrences="5" value="ú_þú_" /> + <ngram occurrences="5" value="ú_þú" /> + <ngram occurrences="5" value="ú_ø" /> + <ngram occurrences="5" value="ú_å_" /> + <ngram occurrences="5" value="ù_þþ_" /> + <ngram occurrences="5" value="øû" /> + <ngram occurrences="5" value="ø_þú" /> + <ngram occurrences="5" value="ô" /> + <ngram occurrences="5" value="î" /> + <ngram occurrences="5" value="å¨" /> + <ngram occurrences="5" value="â" /> + <ngram occurrences="5" value="¹µþ_þ" /> + <ngram occurrences="5" value="µþú_" /> + <ngram occurrences="5" value="µþú" /> + <ngram occurrences="5" value="µø" /> + <ngram occurrences="5" value="ªþ_þ" /> + <ngram occurrences="5" value="_¸_þ" /> + <ngram occurrences="5" value="_þ¨_þ" /> + <ngram occurrences="5" value="_þþ¸_" /> + <ngram occurrences="5" value="_þþ¸" /> +</ngrams> diff --git a/src/plugins/language/mf.klp b/src/plugins/language/mf.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="740" value="_" /> + <ngram occurrences="454" value="e" /> + <ngram occurrences="236" value="n" /> + <ngram occurrences="235" value="t" /> + <ngram occurrences="216" value="i" /> + <ngram occurrences="193" value="o" /> + <ngram occurrences="191" value="a" /> + <ngram occurrences="165" value="r" /> + <ngram occurrences="138" value="t_" /> + <ngram occurrences="135" value="n_" /> + <ngram occurrences="129" value="s" /> + <ngram occurrences="125" value="e_" /> + <ngram occurrences="117" value="l" /> + <ngram occurrences="108" value="d" /> + <ngram occurrences="100" value="k" /> + <ngram occurrences="85" value="en" /> + <ngram occurrences="83" value="j" /> + <ngram occurrences="79" value="m" /> + <ngram occurrences="75" value="_d" /> + <ngram occurrences="71" value="en_" /> + <ngram occurrences="69" value="h" /> + <ngram occurrences="67" value="er" /> + <ngram occurrences="66" value="g" /> + <ngram occurrences="64" value="y" /> + <ngram occurrences="63" value="w" /> + <ngram occurrences="63" value="r_" /> + <ngram occurrences="55" value="z" /> + <ngram occurrences="55" value="b" /> + <ngram occurrences="52" value="_h" /> + <ngram occurrences="50" value="_t" /> + <ngram occurrences="48" value="s_" /> + <ngram occurrences="47" value="_i" /> + <ngram occurrences="46" value="_m" /> + <ngram occurrences="45" value="_w" /> + <ngram occurrences="42" value="_o" /> + <ngram occurrences="40" value="ie" /> + <ngram occurrences="40" value="et" /> + <ngram occurrences="40" value="er_" /> + <ngram occurrences="40" value="_z" /> + <ngram occurrences="40" value="_s" /> + <ngram occurrences="39" value="u" /> + <ngram occurrences="38" value="v" /> + <ngram occurrences="37" value="k_" /> + <ngram occurrences="36" value="f" /> + <ngram occurrences="35" value="p" /> + <ngram occurrences="35" value="oe" /> + <ngram occurrences="35" value="et_" /> + <ngram occurrences="35" value="_b" /> + <ngram occurrences="34" value="in" /> + <ngram occurrences="34" value="de" /> + <ngram occurrences="32" value="y_" /> + <ngram occurrences="32" value="st" /> + <ngram occurrences="31" value="_k" /> + <ngram occurrences="30" value="te" /> + <ngram occurrences="30" value="he" /> + <ngram occurrences="30" value="an" /> + <ngram occurrences="30" value="_e" /> + <ngram occurrences="29" value="ne" /> + <ngram occurrences="29" value="ei" /> + <ngram occurrences="28" value="ij" /> + <ngram occurrences="28" value="aa" /> + <ngram occurrences="27" value="l_" /> + <ngram occurrences="27" value="_v" /> + <ngram occurrences="26" value="is" /> + <ngram occurrences="26" value="at" /> + <ngram occurrences="25" value="je" /> + <ngram occurrences="25" value="_j" /> + <ngram occurrences="25" value="_he" /> + <ngram occurrences="24" value="oo" /> + <ngram occurrences="24" value="at_" /> + <ngram occurrences="24" value="_g" /> + <ngram occurrences="23" value="on" /> + <ngram occurrences="23" value="le" /> + <ngram occurrences="23" value="da" /> + <ngram occurrences="23" value="a_" /> + <ngram occurrences="23" value="_l" /> + <ngram occurrences="23" value="_f" /> + <ngram occurrences="23" value="_da" /> + <ngram occurrences="22" value="re" /> + <ngram occurrences="22" value="in_" /> + <ngram occurrences="22" value="_n" /> + <ngram occurrences="22" value="_de" /> + <ngram occurrences="21" value="it" /> + <ngram occurrences="20" value="me" /> + <ngram occurrences="20" value="de_" /> + <ngram occurrences="20" value="al" /> + <ngram occurrences="20" value="_t_" /> + <ngram occurrences="20" value="_a" /> + <ngram occurrences="19" value="ze" /> + <ngram occurrences="19" value="or" /> + <ngram occurrences="19" value="is_" /> + <ngram occurrences="19" value="ar" /> + <ngram occurrences="19" value="an_" /> + <ngram occurrences="18" value="el" /> + <ngram occurrences="18" value="ee" /> + <ngram occurrences="17" value="ge" /> + <ngram occurrences="17" value="g_" /> + <ngram occurrences="16" value="n_d" /> + <ngram occurrences="16" value="ll" /> + <ngram occurrences="16" value="ik" /> + <ngram occurrences="16" value="_me" /> + <ngram occurrences="16" value="_en_" /> + <ngram occurrences="16" value="_en" /> + <ngram occurrences="16" value="_de_" /> + <ngram occurrences="15" value="æ" /> + <ngram occurrences="15" value="te_" /> + <ngram occurrences="15" value="ma" /> + <ngram occurrences="15" value="j_" /> + <ngram occurrences="15" value="het_" /> + <ngram occurrences="15" value="het" /> + <ngram occurrences="15" value="dat_" /> + <ngram occurrences="15" value="dat" /> + <ngram occurrences="15" value="be" /> + <ngram occurrences="15" value="_het_" /> + <ngram occurrences="15" value="_het" /> + <ngram occurrences="15" value="_dat_" /> + <ngram occurrences="15" value="_dat" /> + <ngram occurrences="14" value="wi" /> + <ngram occurrences="14" value="ve" /> + <ngram occurrences="14" value="nt" /> + <ngram occurrences="14" value="ne_" /> + <ngram occurrences="14" value="m_" /> + <ngram occurrences="14" value="ik_" /> + <ngram occurrences="14" value="es" /> + <ngram occurrences="14" value="di" /> + <ngram occurrences="13" value="yn" /> + <ngram occurrences="13" value="we" /> + <ngram occurrences="13" value="ri" /> + <ngram occurrences="13" value="ol" /> + <ngram occurrences="13" value="n_m" /> + <ngram occurrences="13" value="li" /> + <ngram occurrences="13" value="ke" /> + <ngram occurrences="13" value="je_" /> + <ngram occurrences="13" value="it_" /> + <ngram occurrences="13" value="ij_" /> + <ngram occurrences="13" value="i_" /> + <ngram occurrences="13" value="d_" /> + <ngram occurrences="13" value="_y" /> + <ngram occurrences="13" value="_ik_" /> + <ngram occurrences="13" value="_ik" /> + <ngram occurrences="13" value="_di" /> + <ngram occurrences="12" value="zi" /> + <ngram occurrences="12" value="wa" /> + <ngram occurrences="12" value="t_o" /> + <ngram occurrences="12" value="ro" /> + <ngram occurrences="12" value="p_" /> + <ngram occurrences="12" value="ou" /> + <ngram occurrences="12" value="lle" /> + <ngram occurrences="12" value="la" /> + <ngram occurrences="12" value="jo" /> + <ngram occurrences="12" value="ien" /> + <ngram occurrences="12" value="hi" /> + <ngram occurrences="12" value="ha" /> + <ngram occurrences="12" value="ei_" /> + <ngram occurrences="12" value="ch" /> + <ngram occurrences="12" value="c" /> + <ngram occurrences="12" value="_ne" /> + <ngram occurrences="12" value="_al" /> + <ngram occurrences="11" value="tj" /> + <ngram occurrences="11" value="ta" /> + <ngram occurrences="11" value="t_w" /> + <ngram occurrences="11" value="t_d" /> + <ngram occurrences="11" value="om" /> + <ngram occurrences="11" value="nn" /> + <ngram occurrences="11" value="n_e" /> + <ngram occurrences="11" value="le_" /> + <ngram occurrences="11" value="il" /> + <ngram occurrences="11" value="ier" /> + <ngram occurrences="11" value="ar_" /> + <ngram occurrences="11" value="_in" /> + <ngram occurrences="11" value="_ha" /> + <ngram occurrences="10" value="wo" /> + <ngram occurrences="10" value="t_s" /> + <ngram occurrences="10" value="ste" /> + <ngram occurrences="10" value="sch" /> + <ngram occurrences="10" value="sc" /> + <ngram occurrences="10" value="re_" /> + <ngram occurrences="10" value="nt_" /> + <ngram occurrences="10" value="nne" /> + <ngram occurrences="10" value="n_t" /> + <ngram occurrences="10" value="n_h" /> + <ngram occurrences="10" value="lle_" /> + <ngram occurrences="10" value="e_h" /> + <ngram occurrences="10" value="der_" /> + <ngram occurrences="10" value="der" /> + <ngram occurrences="10" value="_zi" /> + <ngram occurrences="10" value="_wi" /> + <ngram occurrences="10" value="_wa" /> + <ngram occurrences="10" value="_st" /> + <ngram occurrences="10" value="_p" /> + <ngram occurrences="10" value="_oo" /> + <ngram occurrences="10" value="_ma" /> + <ngram occurrences="10" value="_is_" /> + <ngram occurrences="10" value="_is" /> + <ngram occurrences="10" value="_in_" /> + <ngram occurrences="9" value="zo" /> + <ngram occurrences="9" value="vo" /> + <ngram occurrences="9" value="t_i" /> + <ngram occurrences="9" value="ok" /> + <ngram occurrences="9" value="og" /> + <ngram occurrences="9" value="nne_" /> + <ngram occurrences="9" value="n_g" /> + <ngram occurrences="9" value="mei" /> + <ngram occurrences="9" value="ko" /> + <ngram occurrences="9" value="ig" /> + <ngram occurrences="9" value="fo" /> + <ngram occurrences="9" value="ea" /> + <ngram occurrences="9" value="e_k" /> + <ngram occurrences="9" value="e_f" /> + <ngram occurrences="9" value="aar" /> + <ngram occurrences="9" value="_zo" /> + <ngram occurrences="9" value="_ze" /> + <ngram occurrences="9" value="_we" /> + <ngram occurrences="9" value="_mei" /> + <ngram occurrences="9" value="_ko" /> + <ngram occurrences="9" value="_jo" /> + <ngram occurrences="9" value="_ie" /> + <ngram occurrences="9" value="_hi" /> + <ngram occurrences="9" value="_fo" /> + <ngram occurrences="8" value="yn_" /> + <ngram occurrences="8" value="ver" /> + <ngram occurrences="8" value="tr" /> + <ngram occurrences="8" value="t_t" /> + <ngram occurrences="8" value="t_h" /> + <ngram occurrences="8" value="t_b" /> + <ngram occurrences="8" value="st_" /> + <ngram occurrences="8" value="oor" /> + <ngram occurrences="8" value="oer" /> + <ngram occurrences="8" value="ni" /> + <ngram occurrences="8" value="mei_" /> + <ngram occurrences="8" value="kr" /> + <ngram occurrences="8" value="iet" /> + <ngram occurrences="8" value="ier_" /> + <ngram occurrences="8" value="ien_" /> + <ngram occurrences="8" value="en_m" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="e_j" /> + <ngram occurrences="8" value="e_i" /> + <ngram occurrences="8" value="br" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="al_" /> + <ngram occurrences="8" value="_vo" /> + <ngram occurrences="8" value="_r" /> + <ngram occurrences="8" value="_mei_" /> + <ngram occurrences="8" value="_be" /> + <ngram occurrences="7" value="zil" /> + <ngram occurrences="7" value="uw" /> + <ngram occurrences="7" value="u_" /> + <ngram occurrences="7" value="ti" /> + <ngram occurrences="7" value="ta_" /> + <ngram occurrences="7" value="t_m" /> + <ngram occurrences="7" value="t_g" /> + <ngram occurrences="7" value="se" /> + <ngram occurrences="7" value="ry" /> + <ngram occurrences="7" value="rs" /> + <ngram occurrences="7" value="rre_" /> + <ngram occurrences="7" value="rre" /> + <ngram occurrences="7" value="rr" /> + <ngram occurrences="7" value="ra" /> + <ngram occurrences="7" value="or_" /> + <ngram occurrences="7" value="op" /> + <ngram occurrences="7" value="oon" /> + <ngram occurrences="7" value="ol_" /> + <ngram occurrences="7" value="of" /> + <ngram occurrences="7" value="oe_" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="nk" /> + <ngram occurrences="7" value="net_" /> + <ngram occurrences="7" value="net" /> + <ngram occurrences="7" value="n_w" /> + <ngram occurrences="7" value="n_o" /> + <ngram occurrences="7" value="n_k" /> + <ngram occurrences="7" value="n_i" /> + <ngram occurrences="7" value="mi" /> + <ngram occurrences="7" value="jn" /> + <ngram occurrences="7" value="ji" /> + <ngram occurrences="7" value="ijn" /> + <ngram occurrences="7" value="iet_" /> + <ngram occurrences="7" value="hie" /> + <ngram occurrences="7" value="gt" /> + <ngram occurrences="7" value="f_" /> + <ngram occurrences="7" value="en_d" /> + <ngram occurrences="7" value="el_" /> + <ngram occurrences="7" value="ek" /> + <ngram occurrences="7" value="eit_" /> + <ngram occurrences="7" value="eit" /> + <ngram occurrences="7" value="eg" /> + <ngram occurrences="7" value="eer" /> + <ngram occurrences="7" value="ed" /> + <ngram occurrences="7" value="e_v" /> + <ngram occurrences="7" value="e_o" /> + <ngram occurrences="7" value="dy_" /> + <ngram occurrences="7" value="dy" /> + <ngram occurrences="7" value="do" /> + <ngram occurrences="7" value="dij" /> + <ngram occurrences="7" value="as" /> + <ngram occurrences="7" value="aar_" /> + <ngram occurrences="7" value="_zil" /> + <ngram occurrences="7" value="_yn" /> + <ngram occurrences="7" value="_wo" /> + <ngram occurrences="7" value="_ta_" /> + <ngram occurrences="7" value="_ta" /> + <ngram occurrences="7" value="_sch" /> + <ngram occurrences="7" value="_sc" /> + <ngram occurrences="7" value="_net_" /> + <ngram occurrences="7" value="_net" /> + <ngram occurrences="7" value="_mi" /> + <ngram occurrences="7" value="_li" /> + <ngram occurrences="7" value="_kr" /> + <ngram occurrences="7" value="_ien" /> + <ngram occurrences="7" value="_hie" /> + <ngram occurrences="7" value="_dy_" /> + <ngram occurrences="7" value="_dy" /> + <ngram occurrences="7" value="_do" /> + <ngram occurrences="7" value="_dij" /> + <ngram occurrences="7" value="_al_" /> + <ngram occurrences="6" value="za" /> + <ngram occurrences="6" value="wol_" /> + <ngram occurrences="6" value="wol" /> + <ngram occurrences="6" value="tte" /> + <ngram occurrences="6" value="tt" /> + <ngram occurrences="6" value="to" /> + <ngram occurrences="6" value="tje" /> + <ngram occurrences="6" value="ten_" /> + <ngram occurrences="6" value="ten" /> + <ngram occurrences="6" value="t_z" /> + <ngram occurrences="6" value="t_l" /> + <ngram occurrences="6" value="t_e" /> + <ngram occurrences="6" value="t_da" /> + <ngram occurrences="6" value="ste_" /> + <ngram occurrences="6" value="s_i" /> + <ngram occurrences="6" value="rt" /> + <ngram occurrences="6" value="rk" /> + <ngram occurrences="6" value="r_t" /> + <ngram occurrences="6" value="r_i" /> + <ngram occurrences="6" value="ou_" /> + <ngram occurrences="6" value="op_" /> + <ngram occurrences="6" value="ont" /> + <ngram occurrences="6" value="on_" /> + <ngram occurrences="6" value="om_" /> + <ngram occurrences="6" value="o_" /> + <ngram occurrences="6" value="ng" /> + <ngram occurrences="6" value="n_z" /> + <ngram occurrences="6" value="n_he" /> + <ngram occurrences="6" value="n_en_" /> + <ngram occurrences="6" value="n_en" /> + <ngram occurrences="6" value="my" /> + <ngram occurrences="6" value="mo" /> + <ngram occurrences="6" value="man" /> + <ngram occurrences="6" value="m_d" /> + <ngram occurrences="6" value="kk" /> + <ngram occurrences="6" value="kj" /> + <ngram occurrences="6" value="k_w" /> + <ngram occurrences="6" value="jn_" /> + <ngram occurrences="6" value="jen" /> + <ngram occurrences="6" value="ja" /> + <ngram occurrences="6" value="ijn_" /> + <ngram occurrences="6" value="hei" /> + <ngram occurrences="6" value="est" /> + <ngram occurrences="6" value="ere" /> + <ngram occurrences="6" value="en_h" /> + <ngram occurrences="6" value="e_w" /> + <ngram occurrences="6" value="e_t" /> + <ngram occurrences="6" value="e_m" /> + <ngram occurrences="6" value="e_he" /> + <ngram occurrences="6" value="e_d" /> + <ngram occurrences="6" value="am" /> + <ngram occurrences="6" value="aan_" /> + <ngram occurrences="6" value="aan" /> + <ngram occurrences="6" value="_za" /> + <ngram occurrences="6" value="_ve" /> + <ngram occurrences="6" value="_tr" /> + <ngram occurrences="6" value="_tj" /> + <ngram occurrences="6" value="_op_" /> + <ngram occurrences="6" value="_op" /> + <ngram occurrences="6" value="_om" /> + <ngram occurrences="6" value="_my" /> + <ngram occurrences="6" value="_mo" /> + <ngram occurrences="6" value="_la" /> + <ngram occurrences="6" value="_ien_" /> + <ngram occurrences="6" value="_ge" /> + <ngram occurrences="6" value="_ee" /> + <ngram occurrences="6" value="_br" /> + <ngram occurrences="5" value="zy" /> + <ngram occurrences="5" value="zen" /> + <ngram occurrences="5" value="y_d" /> + <ngram occurrences="5" value="wy" /> + <ngram occurrences="5" value="wie" /> + <ngram occurrences="5" value="va" /> + <ngram occurrences="5" value="ui" /> + <ngram occurrences="5" value="t_oo" /> + <ngram occurrences="5" value="t_k" /> + <ngram occurrences="5" value="t_is_" /> + <ngram occurrences="5" value="t_is" /> + <ngram occurrences="5" value="t_be" /> + <ngram occurrences="5" value="so" /> + <ngram occurrences="5" value="si" /> + <ngram occurrences="5" value="s_z" /> + <ngram occurrences="5" value="s_h" /> + <ngram occurrences="5" value="s_b" /> +</ngrams> diff --git a/src/plugins/language/middle-frisian.klp b/src/plugins/language/middle-frisian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="721" value="_" /> + <ngram occurrences="468" value="e" /> + <ngram occurrences="259" value="n" /> + <ngram occurrences="229" value="t" /> + <ngram occurrences="187" value="i" /> + <ngram occurrences="183" value="a" /> + <ngram occurrences="176" value="o" /> + <ngram occurrences="174" value="r" /> + <ngram occurrences="153" value="n_" /> + <ngram occurrences="129" value="t_" /> + <ngram occurrences="128" value="d" /> + <ngram occurrences="123" value="s" /> + <ngram occurrences="117" value="e_" /> + <ngram occurrences="107" value="l" /> + <ngram occurrences="94" value="en" /> + <ngram occurrences="81" value="m" /> + <ngram occurrences="80" value="g" /> + <ngram occurrences="80" value="en_" /> + <ngram occurrences="78" value="k" /> + <ngram occurrences="76" value="er" /> + <ngram occurrences="71" value="j" /> + <ngram occurrences="69" value="h" /> + <ngram occurrences="69" value="_d" /> + <ngram occurrences="66" value="y" /> + <ngram occurrences="65" value="r_" /> + <ngram occurrences="58" value="u" /> + <ngram occurrences="57" value="w" /> + <ngram occurrences="55" value="_h" /> + <ngram occurrences="49" value="z" /> + <ngram occurrences="48" value="b" /> + <ngram occurrences="48" value="_m" /> + <ngram occurrences="47" value="_t" /> + <ngram occurrences="44" value="_w" /> + <ngram occurrences="43" value="ie" /> + <ngram occurrences="43" value="er_" /> + <ngram occurrences="42" value="p" /> + <ngram occurrences="42" value="de" /> + <ngram occurrences="41" value="f" /> + <ngram occurrences="40" value="et" /> + <ngram occurrences="40" value="_i" /> + <ngram occurrences="39" value="v" /> + <ngram occurrences="38" value="s_" /> + <ngram occurrences="38" value="in" /> + <ngram occurrences="37" value="_o" /> + <ngram occurrences="36" value="_b" /> + <ngram occurrences="35" value="an" /> + <ngram occurrences="34" value="te" /> + <ngram occurrences="34" value="st" /> + <ngram occurrences="34" value="_z" /> + <ngram occurrences="34" value="_v" /> + <ngram occurrences="34" value="_e" /> + <ngram occurrences="33" value="_s" /> + <ngram occurrences="32" value="_n" /> + <ngram occurrences="31" value="et_" /> + <ngram occurrences="30" value="_g" /> + <ngram occurrences="29" value="he" /> + <ngram occurrences="29" value="d_" /> + <ngram occurrences="29" value="_k" /> + <ngram occurrences="27" value="y_" /> + <ngram occurrences="27" value="ge" /> + <ngram occurrences="26" value="_he" /> + <ngram occurrences="25" value="re" /> + <ngram occurrences="25" value="oe" /> + <ngram occurrences="25" value="el" /> + <ngram occurrences="25" value="ee" /> + <ngram occurrences="25" value="at" /> + <ngram occurrences="24" value="ne" /> + <ngram occurrences="24" value="k_" /> + <ngram occurrences="24" value="_j" /> + <ngram occurrences="24" value="_de" /> + <ngram occurrences="23" value="de_" /> + <ngram occurrences="23" value="ar" /> + <ngram occurrences="23" value="an_" /> + <ngram occurrences="22" value="me" /> + <ngram occurrences="22" value="l_" /> + <ngram occurrences="22" value="ke" /> + <ngram occurrences="22" value="in_" /> + <ngram occurrences="22" value="at_" /> + <ngram occurrences="21" value="yn" /> + <ngram occurrences="21" value="it" /> + <ngram occurrences="21" value="da" /> + <ngram occurrences="21" value="_da" /> + <ngram occurrences="20" value="is" /> + <ngram occurrences="20" value="ij" /> + <ngram occurrences="20" value="g_" /> + <ngram occurrences="19" value="oo" /> + <ngram occurrences="19" value="je" /> + <ngram occurrences="19" value="aa" /> + <ngram occurrences="19" value="_en_" /> + <ngram occurrences="19" value="_en" /> + <ngram occurrences="18" value="c" /> + <ngram occurrences="18" value="_l" /> + <ngram occurrences="18" value="_de_" /> + <ngram occurrences="18" value="_a" /> + <ngram occurrences="17" value="t_d" /> + <ngram occurrences="17" value="st_" /> + <ngram occurrences="17" value="or" /> + <ngram occurrences="17" value="ol" /> + <ngram occurrences="17" value="a_" /> + <ngram occurrences="17" value="_f" /> + <ngram occurrences="16" value="ze" /> + <ngram occurrences="16" value="op" /> + <ngram occurrences="16" value="_t_" /> + <ngram occurrences="15" value="yn_" /> + <ngram occurrences="15" value="va" /> + <ngram occurrences="15" value="te_" /> + <ngram occurrences="15" value="on" /> + <ngram occurrences="15" value="nd" /> + <ngram occurrences="15" value="n_h" /> + <ngram occurrences="15" value="le" /> + <ngram occurrences="15" value="_me" /> + <ngram occurrences="14" value="æ" /> + <ngram occurrences="14" value="p_" /> + <ngram occurrences="14" value="no" /> + <ngram occurrences="14" value="ma" /> + <ngram occurrences="14" value="m_" /> + <ngram occurrences="14" value="di" /> + <ngram occurrences="14" value="der" /> + <ngram occurrences="14" value="_va" /> + <ngram occurrences="13" value="wa" /> + <ngram occurrences="13" value="ve" /> + <ngram occurrences="13" value="ou" /> + <ngram occurrences="13" value="om" /> + <ngram occurrences="13" value="n_t" /> + <ngram occurrences="13" value="la" /> + <ngram occurrences="13" value="f_" /> + <ngram occurrences="13" value="eg" /> + <ngram occurrences="13" value="e_w" /> + <ngram occurrences="13" value="ch" /> + <ngram occurrences="13" value="ar_" /> + <ngram occurrences="13" value="_ma" /> + <ngram occurrences="13" value="_in" /> + <ngram occurrences="12" value="ti" /> + <ngram occurrences="12" value="n_o" /> + <ngram occurrences="12" value="n_m" /> + <ngram occurrences="12" value="ll" /> + <ngram occurrences="12" value="it_" /> + <ngram occurrences="12" value="es" /> + <ngram occurrences="12" value="as" /> + <ngram occurrences="12" value="al" /> + <ngram occurrences="12" value="_wa" /> + <ngram occurrences="12" value="_p" /> + <ngram occurrences="12" value="_op" /> + <ngram occurrences="12" value="_no" /> + <ngram occurrences="12" value="_ge" /> + <ngram occurrences="11" value="we" /> + <ngram occurrences="11" value="tte" /> + <ngram occurrences="11" value="tt" /> + <ngram occurrences="11" value="tj" /> + <ngram occurrences="11" value="t_m" /> + <ngram occurrences="11" value="sch" /> + <ngram occurrences="11" value="sc" /> + <ngram occurrences="11" value="ro" /> + <ngram occurrences="11" value="ri" /> + <ngram occurrences="11" value="ne_" /> + <ngram occurrences="11" value="n_b" /> + <ngram occurrences="11" value="my" /> + <ngram occurrences="11" value="li" /> + <ngram occurrences="11" value="ko" /> + <ngram occurrences="11" value="is_" /> + <ngram occurrences="11" value="ho" /> + <ngram occurrences="11" value="het_" /> + <ngram occurrences="11" value="het" /> + <ngram occurrences="11" value="el_" /> + <ngram occurrences="11" value="der_" /> + <ngram occurrences="11" value="be" /> + <ngram occurrences="11" value="_u" /> + <ngram occurrences="11" value="_in_" /> + <ngram occurrences="11" value="_het_" /> + <ngram occurrences="11" value="_het" /> + <ngram occurrences="11" value="_di" /> + <ngram occurrences="10" value="wi" /> + <ngram occurrences="10" value="u_" /> + <ngram occurrences="10" value="t_h" /> + <ngram occurrences="10" value="rt" /> + <ngram occurrences="10" value="op_" /> + <ngram occurrences="10" value="ng" /> + <ngram occurrences="10" value="n_i" /> + <ngram occurrences="10" value="lle_" /> + <ngram occurrences="10" value="lle" /> + <ngram occurrences="10" value="le_" /> + <ngram occurrences="10" value="jo" /> + <ngram occurrences="10" value="jn" /> + <ngram occurrences="10" value="ji" /> + <ngram occurrences="10" value="en_m" /> + <ngram occurrences="10" value="ei" /> + <ngram occurrences="10" value="dat" /> + <ngram occurrences="10" value="_ve" /> + <ngram occurrences="10" value="_te" /> + <ngram occurrences="10" value="_my" /> + <ngram occurrences="10" value="_dat" /> + <ngram occurrences="9" value="za" /> + <ngram occurrences="9" value="ui" /> + <ngram occurrences="9" value="ter" /> + <ngram occurrences="9" value="r_i" /> + <ngram occurrences="9" value="of" /> + <ngram occurrences="9" value="nne_" /> + <ngram occurrences="9" value="nne" /> + <ngram occurrences="9" value="nn" /> + <ngram occurrences="9" value="n_he" /> + <ngram occurrences="9" value="j_" /> + <ngram occurrences="9" value="ien" /> + <ngram occurrences="9" value="ha" /> + <ngram occurrences="9" value="eer" /> + <ngram occurrences="9" value="e_h" /> + <ngram occurrences="9" value="e_d" /> + <ngram occurrences="9" value="dat_" /> + <ngram occurrences="9" value="aar" /> + <ngram occurrences="9" value="_za" /> + <ngram occurrences="9" value="_te_" /> + <ngram occurrences="9" value="_ne" /> + <ngram occurrences="9" value="_ko" /> + <ngram occurrences="9" value="_dat_" /> + <ngram occurrences="8" value="zy" /> + <ngram occurrences="8" value="wo" /> + <ngram occurrences="8" value="vo" /> + <ngram occurrences="8" value="ver" /> + <ngram occurrences="8" value="van" /> + <ngram occurrences="8" value="uw" /> + <ngram occurrences="8" value="t_z" /> + <ngram occurrences="8" value="t_v" /> + <ngram occurrences="8" value="t_t" /> + <ngram occurrences="8" value="og" /> + <ngram occurrences="8" value="n_s" /> + <ngram occurrences="8" value="n_e" /> + <ngram occurrences="8" value="n_d" /> + <ngram occurrences="8" value="mi" /> + <ngram occurrences="8" value="ke_" /> + <ngram occurrences="8" value="jn_" /> + <ngram occurrences="8" value="jen_" /> + <ngram occurrences="8" value="jen" /> + <ngram occurrences="8" value="il" /> + <ngram occurrences="8" value="ijn" /> + <ngram occurrences="8" value="ij_" /> + <ngram occurrences="8" value="ier" /> + <ngram occurrences="8" value="ie_" /> + <ngram occurrences="8" value="gt" /> + <ngram occurrences="8" value="gr" /> + <ngram occurrences="8" value="gen" /> + <ngram occurrences="8" value="fe" /> + <ngram occurrences="8" value="en_o" /> + <ngram occurrences="8" value="ed" /> + <ngram occurrences="8" value="ea" /> + <ngram occurrences="8" value="dan_" /> + <ngram occurrences="8" value="dan" /> + <ngram occurrences="8" value="_zy" /> + <ngram occurrences="8" value="_wi" /> + <ngram occurrences="8" value="_van" /> + <ngram occurrences="8" value="_sch" /> + <ngram occurrences="8" value="_sc" /> + <ngram occurrences="8" value="_r" /> + <ngram occurrences="8" value="_ji" /> + <ngram occurrences="8" value="_ho" /> + <ngram occurrences="8" value="_ha" /> + <ngram occurrences="8" value="_gr" /> + <ngram occurrences="8" value="_dan_" /> + <ngram occurrences="8" value="_dan" /> + <ngram occurrences="7" value="zi" /> + <ngram occurrences="7" value="za_" /> + <ngram occurrences="7" value="wy" /> + <ngram occurrences="7" value="wat_" /> + <ngram occurrences="7" value="wat" /> + <ngram occurrences="7" value="van_" /> + <ngram occurrences="7" value="tr" /> + <ngram occurrences="7" value="ta" /> + <ngram occurrences="7" value="t_s" /> + <ngram occurrences="7" value="t_b" /> + <ngram occurrences="7" value="ss" /> + <ngram occurrences="7" value="ren_" /> + <ngram occurrences="7" value="ren" /> + <ngram occurrences="7" value="or_" /> + <ngram occurrences="7" value="om_" /> + <ngram occurrences="7" value="oll" /> + <ngram occurrences="7" value="nk" /> + <ngram occurrences="7" value="ni" /> + <ngram occurrences="7" value="net" /> + <ngram occurrences="7" value="n_n" /> + <ngram occurrences="7" value="men_" /> + <ngram occurrences="7" value="men" /> + <ngram occurrences="7" value="ken" /> + <ngram occurrences="7" value="je_" /> + <ngram occurrences="7" value="ik_" /> + <ngram occurrences="7" value="ik" /> + <ngram occurrences="7" value="ijn_" /> + <ngram occurrences="7" value="i_" /> + <ngram occurrences="7" value="hi" /> + <ngram occurrences="7" value="hee" /> + <ngram occurrences="7" value="gt_" /> + <ngram occurrences="7" value="eu" /> + <ngram occurrences="7" value="est" /> + <ngram occurrences="7" value="ek" /> + <ngram occurrences="7" value="e_z" /> + <ngram occurrences="7" value="e_v" /> + <ngram occurrences="7" value="e_k" /> + <ngram occurrences="7" value="e_b" /> + <ngram occurrences="7" value="do" /> + <ngram occurrences="7" value="by" /> + <ngram occurrences="7" value="and" /> + <ngram occurrences="7" value="ae" /> + <ngram occurrences="7" value="_ze" /> + <ngram occurrences="7" value="_za_" /> + <ngram occurrences="7" value="_wo" /> + <ngram occurrences="7" value="_we" /> + <ngram occurrences="7" value="_wat_" /> + <ngram occurrences="7" value="_wat" /> + <ngram occurrences="7" value="_vo" /> + <ngram occurrences="7" value="_ver" /> + <ngram occurrences="7" value="_van_" /> + <ngram occurrences="7" value="_op_" /> + <ngram occurrences="7" value="_oo" /> + <ngram occurrences="7" value="_of" /> + <ngram occurrences="7" value="_mi" /> + <ngram occurrences="7" value="_fe" /> + <ngram occurrences="7" value="_by" /> + <ngram occurrences="7" value="_be" /> + <ngram occurrences="6" value="zyn_" /> + <ngram occurrences="6" value="zyn" /> + <ngram occurrences="6" value="zen" /> + <ngram occurrences="6" value="yn_h" /> + <ngram occurrences="6" value="wie" /> + <ngram occurrences="6" value="us" /> + <ngram occurrences="6" value="ud" /> + <ngram occurrences="6" value="to" /> + <ngram occurrences="6" value="tje" /> + <ngram occurrences="6" value="tie" /> + <ngram occurrences="6" value="ter_" /> + <ngram occurrences="6" value="t_w" /> + <ngram occurrences="6" value="t_j" /> + <ngram occurrences="6" value="t_g" /> + <ngram occurrences="6" value="se" /> + <ngram occurrences="6" value="ry" /> + <ngram occurrences="6" value="rs" /> + <ngram occurrences="6" value="re_" /> + <ngram occurrences="6" value="rd" /> + <ngram occurrences="6" value="r_d" /> + <ngram occurrences="6" value="pr" /> + <ngram occurrences="6" value="ou_" /> + <ngram occurrences="6" value="oor" /> + <ngram occurrences="6" value="olle_" /> + <ngram occurrences="6" value="olle" /> + <ngram occurrences="6" value="of_" /> + <ngram occurrences="6" value="oer" /> + <ngram occurrences="6" value="ns" /> + <ngram occurrences="6" value="net_" /> + <ngram occurrences="6" value="nder" /> + <ngram occurrences="6" value="nde" /> + <ngram occurrences="6" value="n_w" /> + <ngram occurrences="6" value="n_v" /> + <ngram occurrences="6" value="n_t_" /> + <ngram occurrences="6" value="n_k" /> + <ngram occurrences="6" value="n_hee" /> + <ngram occurrences="6" value="lit" /> + <ngram occurrences="6" value="lan" /> + <ngram occurrences="6" value="l_m" /> + <ngram occurrences="6" value="ken_" /> + <ngram occurrences="6" value="jie" /> + <ngram occurrences="6" value="ist" /> + <ngram occurrences="6" value="ig" /> + <ngram occurrences="6" value="iet_" /> + <ngram occurrences="6" value="iet" /> + <ngram occurrences="6" value="ien_" /> + <ngram occurrences="6" value="heer_" /> + <ngram occurrences="6" value="heer" /> + <ngram occurrences="6" value="gen_" /> + <ngram occurrences="6" value="fi" /> + <ngram occurrences="6" value="est_" /> + <ngram occurrences="6" value="ert" /> + <ngram occurrences="6" value="ere" /> + <ngram occurrences="6" value="er_i" /> + <ngram occurrences="6" value="en_n" /> + <ngram occurrences="6" value="em" /> + <ngram occurrences="6" value="eer_" /> + <ngram occurrences="6" value="e_t" /> + <ngram occurrences="6" value="e_s" /> + <ngram occurrences="6" value="e_l" /> + <ngram occurrences="6" value="e_j" /> + <ngram occurrences="6" value="e_e" /> + <ngram occurrences="6" value="dij" /> + <ngram occurrences="6" value="bo" /> + <ngram occurrences="6" value="af" /> + <ngram occurrences="6" value="_zyn_" /> + <ngram occurrences="6" value="_zyn" /> + <ngram occurrences="6" value="_zi" /> + <ngram occurrences="6" value="_wy" /> + <ngram occurrences="6" value="_tj" /> + <ngram occurrences="6" value="_st" /> + <ngram occurrences="6" value="_of_" /> + <ngram occurrences="6" value="_net_" /> + <ngram occurrences="6" value="_net" /> + <ngram occurrences="6" value="_la" /> + <ngram occurrences="6" value="_is" /> + <ngram occurrences="6" value="_ik_" /> + <ngram occurrences="6" value="_ik" /> + <ngram occurrences="6" value="_ie" /> + <ngram occurrences="6" value="_heer" /> + <ngram occurrences="6" value="_hee" /> + <ngram occurrences="6" value="_er" /> + <ngram occurrences="6" value="_dij" /> + <ngram occurrences="6" value="_der_" /> + <ngram occurrences="6" value="_der" /> +</ngrams> diff --git a/src/plugins/language/mingo.klp b/src/plugins/language/mingo.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="775" value="_" /> + <ngram occurrences="342" value="n" /> + <ngram occurrences="321" value="a" /> + <ngram occurrences="309" value="t" /> + <ngram occurrences="307" value="k" /> + <ngram occurrences="236" value="e" /> + <ngram occurrences="225" value="ë" /> + <ngram occurrences="222" value="h" /> + <ngram occurrences="194" value="u" /> + <ngram occurrences="190" value="s" /> + <ngram occurrences="187" value="y" /> + <ngram occurrences="184" value="_n" /> + <ngram occurrences="175" value="w" /> + <ngram occurrences="159" value="e_" /> + <ngram occurrences="157" value="ö" /> + <ngram occurrences="115" value="_t" /> + <ngram occurrences="110" value="_k" /> + <ngram occurrences="101" value="ne" /> + <ngram occurrences="94" value="u_" /> + <ngram occurrences="92" value="ne_" /> + <ngram occurrences="92" value="_ne" /> + <ngram occurrences="90" value="i" /> + <ngram occurrences="90" value="_ne_" /> + <ngram occurrences="83" value="a_" /> + <ngram occurrences="82" value="ô" /> + <ngram occurrences="74" value="ö_" /> + <ngram occurrences="70" value="ë_" /> + <ngram occurrences="67" value="wa" /> + <ngram occurrences="65" value="_h" /> + <ngram occurrences="60" value="á" /> + <ngram occurrences="59" value="_ë" /> + <ngram occurrences="57" value="kw" /> + <ngram occurrences="55" value="_u" /> + <ngram occurrences="54" value="ê" /> + <ngram occurrences="54" value="é" /> + <ngram occurrences="54" value="hu" /> + <ngram occurrences="50" value="s_" /> + <ngram occurrences="48" value="í" /> + <ngram occurrences="47" value="nö" /> + <ngram occurrences="46" value="at" /> + <ngram occurrences="44" value="ta" /> + <ngram occurrences="44" value="ka" /> + <ngram occurrences="43" value="yu" /> + <ngram occurrences="43" value="ak" /> + <ngram occurrences="42" value="ha" /> + <ngram occurrences="41" value="kh" /> + <ngram occurrences="41" value="_s" /> + <ngram occurrences="39" value="wë" /> + <ngram occurrences="38" value="hs" /> + <ngram occurrences="38" value="e_n" /> + <ngram occurrences="37" value="ô_" /> + <ngram occurrences="37" value="_a" /> + <ngram occurrences="36" value="i_" /> + <ngram occurrences="34" value="ën" /> + <ngram occurrences="34" value="te" /> + <ngram occurrences="33" value="th" /> + <ngram occurrences="33" value="hu_" /> + <ngram occurrences="32" value="ny" /> + <ngram occurrences="32" value="_w" /> + <ngram occurrences="31" value="ú" /> + <ngram occurrences="30" value="æ" /> + <ngram occurrences="28" value="yu_" /> + <ngram occurrences="28" value="ty" /> + <ngram occurrences="28" value="t_" /> + <ngram occurrences="27" value="ya" /> + <ngram occurrences="27" value="kë" /> + <ngram occurrences="26" value="ê_" /> + <ngram occurrences="26" value="ni" /> + <ngram occurrences="26" value="_wa" /> + <ngram occurrences="26" value="_kh" /> + <ngram occurrences="25" value="öt" /> + <ngram occurrences="25" value="ët" /> + <ngram occurrences="25" value="wën" /> + <ngram occurrences="25" value="ní" /> + <ngram occurrences="25" value="khu_" /> + <ngram occurrences="25" value="khu" /> + <ngram occurrences="25" value="e_k" /> + <ngram occurrences="24" value="íy" /> + <ngram occurrences="24" value="na" /> + <ngram occurrences="24" value="n_" /> + <ngram occurrences="24" value="_na" /> + <ngram occurrences="24" value="_hu" /> + <ngram occurrences="23" value="yë" /> + <ngram occurrences="23" value="kwa" /> + <ngram occurrences="23" value="e_t" /> + <ngram occurrences="23" value="_ö" /> + <ngram occurrences="23" value="_n_" /> + <ngram occurrences="23" value="_khu_" /> + <ngram occurrences="23" value="_khu" /> + <ngram occurrences="23" value="_ka" /> + <ngram occurrences="22" value="ye" /> + <ngram occurrences="22" value="sh" /> + <ngram occurrences="22" value="sa" /> + <ngram occurrences="21" value="ö_n" /> + <ngram occurrences="21" value="ës" /> + <ngram occurrences="21" value="wa_" /> + <ngram occurrences="21" value="nö_" /> + <ngram occurrences="21" value="ku" /> + <ngram occurrences="21" value="ek" /> + <ngram occurrences="21" value="e_h" /> + <ngram occurrences="21" value="aw" /> + <ngram occurrences="21" value="ae" /> + <ngram occurrences="21" value="_ha" /> + <ngram occurrences="20" value="un" /> + <ngram occurrences="20" value="u_t" /> + <ngram occurrences="20" value="u_n" /> + <ngram occurrences="20" value="u_k" /> + <ngram occurrences="20" value="ta_" /> + <ngram occurrences="20" value="ae_" /> + <ngram occurrences="19" value="ëk" /> + <ngram occurrences="19" value="ëh" /> + <ngram occurrences="19" value="yö" /> + <ngram occurrences="19" value="të" /> + <ngram occurrences="19" value="níy" /> + <ngram occurrences="19" value="në" /> + <ngram occurrences="19" value="ne_k" /> + <ngram occurrences="19" value="iy" /> + <ngram occurrences="19" value="as" /> + <ngram occurrences="19" value="_ta" /> + <ngram occurrences="18" value="íyu" /> + <ngram occurrences="18" value="â" /> + <ngram occurrences="18" value="ut" /> + <ngram occurrences="18" value="us" /> + <ngram occurrences="18" value="té" /> + <ngram occurrences="18" value="ts" /> + <ngram occurrences="18" value="kê" /> + <ngram occurrences="18" value="k_" /> + <ngram occurrences="18" value="e_ne_" /> + <ngram occurrences="18" value="e_ne" /> + <ngram occurrences="18" value="_te" /> + <ngram occurrences="18" value="_ne_k" /> + <ngram occurrences="17" value="íyu_" /> + <ngram occurrences="17" value="ëníyu" /> + <ngram occurrences="17" value="ëníy" /> + <ngram occurrences="17" value="ëní" /> + <ngram occurrences="17" value="ë_n" /> + <ngram occurrences="17" value="ë_k" /> + <ngram occurrences="17" value="ák" /> + <ngram occurrences="17" value="wëníy" /> + <ngram occurrences="17" value="wëní" /> + <ngram occurrences="17" value="níyu_" /> + <ngram occurrences="17" value="níyu" /> + <ngram occurrences="17" value="ne_n" /> + <ngram occurrences="17" value="nae_" /> + <ngram occurrences="17" value="nae" /> + <ngram occurrences="17" value="_ö_" /> + <ngram occurrences="17" value="_ne_n" /> + <ngram occurrences="17" value="_nae_" /> + <ngram occurrences="17" value="_nae" /> + <ngram occurrences="16" value="st" /> + <ngram occurrences="16" value="si" /> + <ngram occurrences="16" value="nô" /> + <ngram occurrences="16" value="ne_t" /> + <ngram occurrences="16" value="awë" /> + <ngram occurrences="16" value="a_t" /> + <ngram occurrences="16" value="_u_" /> + <ngram occurrences="16" value="_ne_t" /> + <ngram occurrences="16" value="_kë" /> + <ngram occurrences="15" value="ôt" /> + <ngram occurrences="15" value="ôk" /> + <ngram occurrences="15" value="ës_" /> + <ngram occurrences="15" value="ëhs" /> + <ngram occurrences="15" value="êt" /> + <ngram occurrences="15" value="é_" /> + <ngram occurrences="15" value="wá" /> + <ngram occurrences="15" value="ke" /> + <ngram occurrences="15" value="an" /> + <ngram occurrences="15" value="ah" /> + <ngram occurrences="15" value="_un" /> + <ngram occurrences="15" value="_sh" /> + <ngram occurrences="14" value="én" /> + <ngram occurrences="14" value="æ_" /> + <ngram occurrences="14" value="á_" /> + <ngram occurrences="14" value="yô" /> + <ngram occurrences="14" value="t_n" /> + <ngram occurrences="14" value="ne_h" /> + <ngram occurrences="14" value="hô" /> + <ngram occurrences="14" value="ay" /> + <ngram occurrences="14" value="a_u" /> + <ngram occurrences="14" value="_ne_h" /> + <ngram occurrences="13" value="â_" /> + <ngram occurrences="13" value="án" /> + <ngram occurrences="13" value="we" /> + <ngram occurrences="13" value="tö" /> + <ngram occurrences="13" value="tê" /> + <ngram occurrences="13" value="sat" /> + <ngram occurrences="13" value="nâ_" /> + <ngram occurrences="13" value="nâ" /> + <ngram occurrences="13" value="kës_" /> + <ngram occurrences="13" value="kës" /> + <ngram occurrences="13" value="he" /> + <ngram occurrences="13" value="awëní" /> + <ngram occurrences="13" value="awën" /> + <ngram occurrences="13" value="a_k" /> + <ngram occurrences="13" value="_të" /> + <ngram occurrences="13" value="_t_" /> + <ngram occurrences="13" value="_nâ_" /> + <ngram occurrences="13" value="_nâ" /> + <ngram occurrences="12" value="ök" /> + <ngram occurrences="12" value="ô_n" /> + <ngram occurrences="12" value="í_" /> + <ngram occurrences="12" value="ëë" /> + <ngram occurrences="12" value="ënö" /> + <ngram occurrences="12" value="ék" /> + <ngram occurrences="12" value="yô_" /> + <ngram occurrences="12" value="yá" /> + <ngram occurrences="12" value="tw" /> + <ngram occurrences="12" value="tak" /> + <ngram occurrences="12" value="sy" /> + <ngram occurrences="12" value="s_n" /> + <ngram occurrences="12" value="në_" /> + <ngram occurrences="12" value="n_a" /> + <ngram occurrences="12" value="kwa_" /> + <ngram occurrences="12" value="ik" /> + <ngram occurrences="12" value="ht" /> + <ngram occurrences="12" value="ey" /> + <ngram occurrences="12" value="e_u" /> + <ngram occurrences="12" value="akw" /> + <ngram occurrences="12" value="_ëk" /> + <ngram occurrences="12" value="_ni" /> + <ngram occurrences="12" value="_n_a" /> + <ngram occurrences="12" value="_kw" /> + <ngram occurrences="12" value="_aw" /> + <ngram occurrences="11" value="ö_k" /> + <ngram occurrences="11" value="wë_" /> + <ngram occurrences="11" value="wé" /> + <ngram occurrences="11" value="we_" /> + <ngram occurrences="11" value="ui" /> + <ngram occurrences="11" value="u_ë" /> + <ngram occurrences="11" value="u_ne" /> + <ngram occurrences="11" value="te_" /> + <ngram occurrences="11" value="niy" /> + <ngram occurrences="11" value="kê_" /> + <ngram occurrences="11" value="i_t" /> + <ngram occurrences="11" value="hö" /> + <ngram occurrences="11" value="hô_" /> + <ngram occurrences="11" value="hu_n" /> + <ngram occurrences="11" value="hsa" /> + <ngram occurrences="11" value="ha_" /> + <ngram occurrences="11" value="_ú" /> + <ngram occurrences="11" value="_ëhs" /> + <ngram occurrences="11" value="_ëh" /> + <ngram occurrences="10" value="ún" /> + <ngram occurrences="10" value="öh" /> + <ngram occurrences="10" value="ên" /> + <ngram occurrences="10" value="ææ" /> + <ngram occurrences="10" value="ya_" /> + <ngram occurrences="10" value="wö" /> + <ngram occurrences="10" value="wat" /> + <ngram occurrences="10" value="uw" /> + <ngram occurrences="10" value="uk" /> + <ngram occurrences="10" value="uikê_" /> + <ngram occurrences="10" value="uikê" /> + <ngram occurrences="10" value="uik" /> + <ngram occurrences="10" value="tö_" /> + <ngram occurrences="10" value="tk" /> + <ngram occurrences="10" value="ti" /> + <ngram occurrences="10" value="sk" /> + <ngram occurrences="10" value="ne_ne" /> + <ngram occurrences="10" value="kan" /> + <ngram occurrences="10" value="k_n" /> + <ngram occurrences="10" value="ikê_" /> + <ngram occurrences="10" value="ikê" /> + <ngram occurrences="10" value="hë" /> + <ngram occurrences="10" value="huikê" /> + <ngram occurrences="10" value="huik" /> + <ngram occurrences="10" value="hui" /> + <ngram occurrences="10" value="e_wa" /> + <ngram occurrences="10" value="e_w" /> + <ngram occurrences="10" value="e_hu" /> + <ngram occurrences="10" value="ai" /> + <ngram occurrences="10" value="aa" /> + <ngram occurrences="10" value="_á" /> + <ngram occurrences="10" value="_y" /> + <ngram occurrences="10" value="_ut" /> + <ngram occurrences="10" value="_ta_" /> + <ngram occurrences="10" value="_kës_" /> + <ngram occurrences="10" value="_kës" /> + <ngram occurrences="10" value="_huik" /> + <ngram occurrences="10" value="_hui" /> + <ngram occurrences="9" value="ös" /> + <ngram occurrences="9" value="ö_ne_" /> + <ngram occurrences="9" value="ö_ne" /> + <ngram occurrences="9" value="ë_t" /> + <ngram occurrences="9" value="ê_n" /> + <ngram occurrences="9" value="yë_" /> + <ngram occurrences="9" value="yê" /> + <ngram occurrences="9" value="u_ne_" /> + <ngram occurrences="9" value="sn" /> + <ngram occurrences="9" value="si_" /> + <ngram occurrences="9" value="s_ë" /> + <ngram occurrences="9" value="nöt" /> + <ngram occurrences="9" value="ne_hu" /> + <ngram occurrences="9" value="n_aw" /> + <ngram occurrences="9" value="kö" /> + <ngram occurrences="9" value="kææ" /> + <ngram occurrences="9" value="kæ" /> + <ngram occurrences="9" value="ku_" /> + <ngram occurrences="9" value="khu_n" /> + <ngram occurrences="9" value="ka_" /> + <ngram occurrences="9" value="hsat" /> + <ngram occurrences="9" value="he_" /> + <ngram occurrences="9" value="ekh" /> + <ngram occurrences="9" value="eh" /> + <ngram occurrences="9" value="e_s" /> + <ngram occurrences="9" value="aty" /> + <ngram occurrences="9" value="a_s" /> + <ngram occurrences="9" value="_ö_n" /> + <ngram occurrences="9" value="_ô" /> + <ngram occurrences="9" value="_ëë" /> + <ngram occurrences="9" value="_ët" /> + <ngram occurrences="9" value="_té" /> + <ngram occurrences="9" value="_n_aw" /> + <ngram occurrences="9" value="_kan" /> + <ngram occurrences="9" value="_hë" /> + <ngram occurrences="9" value="_awë" /> + <ngram occurrences="9" value="_ak" /> + <ngram occurrences="8" value="öte" /> + <ngram occurrences="8" value="ö_h" /> + <ngram occurrences="8" value="ô_ë" /> + <ngram occurrences="8" value="ye_" /> + <ngram occurrences="8" value="wöt" /> + <ngram occurrences="8" value="wai_" /> + <ngram occurrences="8" value="wai" /> + <ngram occurrences="8" value="ust" /> + <ngram occurrences="8" value="unö" /> + <ngram occurrences="8" value="unë" /> + <ngram occurrences="8" value="tá" /> + <ngram occurrences="8" value="twa" /> + <ngram occurrences="8" value="ths" /> + <ngram occurrences="8" value="tey" /> + <ngram occurrences="8" value="tek" /> + <ngram occurrences="8" value="t_ne_" /> + <ngram occurrences="8" value="t_ne" /> + <ngram occurrences="8" value="shô_" /> + <ngram occurrences="8" value="shô" /> + <ngram occurrences="8" value="se" /> + <ngram occurrences="8" value="nyu" /> + <ngram occurrences="8" value="nek" /> + <ngram occurrences="8" value="n_awë" /> + <ngram occurrences="8" value="kë_" /> + <ngram occurrences="8" value="kwë" /> + <ngram occurrences="8" value="kwá" /> + <ngram occurrences="8" value="kwe_" /> + <ngram occurrences="8" value="kwe" /> + <ngram occurrences="8" value="k_ne_" /> + <ngram occurrences="8" value="k_ne" /> + <ngram occurrences="8" value="i_n" /> + <ngram occurrences="8" value="hu_k" /> + <ngram occurrences="8" value="hsi" /> + <ngram occurrences="8" value="e_te" /> + <ngram occurrences="8" value="as_" /> + <ngram occurrences="8" value="ai_" /> + <ngram occurrences="8" value="_ún" /> + <ngram occurrences="8" value="_wai_" /> + <ngram occurrences="8" value="_wai" /> + <ngram occurrences="8" value="_unë" /> + <ngram occurrences="8" value="_te_" /> + <ngram occurrences="8" value="_t_n" /> + <ngram occurrences="8" value="_shô_" /> + <ngram occurrences="8" value="_shô" /> + <ngram occurrences="8" value="_ha_" /> + <ngram occurrences="8" value="_awën" /> + <ngram occurrences="7" value="öë" /> + <ngram occurrences="7" value="ö_s" /> + <ngram occurrences="7" value="ôt_" /> + <ngram occurrences="7" value="ôn" /> + <ngram occurrences="7" value="ôk_" /> + <ngram occurrences="7" value="ëö" /> + <ngram occurrences="7" value="ëy" /> + <ngram occurrences="7" value="ëka" /> + <ngram occurrences="7" value="ë_ë" /> + <ngram occurrences="7" value="êth" /> + <ngram occurrences="7" value="ææ_" /> + <ngram occurrences="7" value="yô_n" /> + <ngram occurrences="7" value="yêt" /> + <ngram occurrences="7" value="yé" /> + <ngram occurrences="7" value="ya_t" /> + <ngram occurrences="7" value="wá_" /> + <ngram occurrences="7" value="wi" /> + <ngram occurrences="7" value="unë_" /> + <ngram occurrences="7" value="u_tê_" /> + <ngram occurrences="7" value="u_tê" /> + <ngram occurrences="7" value="u_t_" /> + <ngram occurrences="7" value="tú" /> + <ngram occurrences="7" value="të_" /> + <ngram occurrences="7" value="tê_" /> + <ngram occurrences="7" value="tsi" /> + <ngram occurrences="7" value="ta_un" /> + <ngram occurrences="7" value="ta_u" /> + <ngram occurrences="7" value="nyu_" /> + <ngram occurrences="7" value="nya" /> + <ngram occurrences="7" value="niyu" /> + <ngram occurrences="7" value="na_u_" /> + <ngram occurrences="7" value="na_u" /> + <ngram occurrences="7" value="na_" /> + <ngram occurrences="7" value="kwé" /> + <ngram occurrences="7" value="kn" /> + <ngram occurrences="7" value="iyu" /> + <ngram occurrences="7" value="hö_" /> +</ngrams> diff --git a/src/plugins/language/nepali.klp b/src/plugins/language/nepali.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1100" value="_" /> + <ngram occurrences="627" value="f" /> + <ngram occurrences="375" value="f_" /> + <ngram occurrences="261" value="l" /> + <ngram occurrences="253" value="g" /> + <ngram occurrences="200" value="s" /> + <ngram occurrences="169" value="d" /> + <ngram occurrences="149" value="k" /> + <ngram occurrences="149" value="g_" /> + <ngram occurrences="127" value="sf" /> + <ngram occurrences="126" value="n" /> + <ngram occurrences="126" value="_l" /> + <ngram occurrences="121" value="t" /> + <ngram occurrences="115" value="sf_" /> + <ngram occurrences="107" value="_s" /> + <ngram occurrences="101" value="j" /> + <ngram occurrences="99" value="_f" /> + <ngram occurrences="97" value="_k" /> + <ngram occurrences="88" value="o" /> + <ngram occurrences="86" value="_d" /> + <ngram occurrences="84" value="u" /> + <ngram occurrences="82" value="x" /> + <ngram occurrences="81" value="b" /> + <ngram occurrences="77" value="l_" /> + <ngram occurrences="69" value="_sf" /> + <ngram occurrences="67" value="_g" /> + <ngram occurrences="66" value="df" /> + <ngram occurrences="65" value="a" /> + <ngram occurrences="61" value="p" /> + <ngram occurrences="59" value="e" /> + <ngram occurrences="59" value="_sf_" /> + <ngram occurrences="56" value="_u" /> + <ngram occurrences="55" value="_f_" /> + <ngram occurrences="52" value="df_" /> + <ngram occurrences="52" value="_t" /> + <ngram occurrences="51" value="k_" /> + <ngram occurrences="51" value="_g_" /> + <ngram occurrences="50" value="n_" /> + <ngram occurrences="50" value="c" /> + <ngram occurrences="50" value="_c" /> + <ngram occurrences="46" value="f_l" /> + <ngram occurrences="45" value="s_" /> + <ngram occurrences="44" value="_e" /> + <ngram occurrences="42" value="x_" /> + <ngram occurrences="42" value="u_" /> + <ngram occurrences="42" value="t_" /> + <ngram occurrences="42" value="o_" /> + <ngram occurrences="41" value="h" /> + <ngram occurrences="40" value="tf" /> + <ngram occurrences="38" value="_a" /> + <ngram occurrences="37" value="m" /> + <ngram occurrences="37" value="b_" /> + <ngram occurrences="36" value="r" /> + <ngram occurrences="35" value="kf" /> + <ngram occurrences="35" value="f_d" /> + <ngram occurrences="34" value="fn" /> + <ngram occurrences="34" value="f_s" /> + <ngram occurrences="34" value="f_k" /> + <ngram occurrences="34" value="_n" /> + <ngram occurrences="34" value="_k_" /> + <ngram occurrences="33" value="lg" /> + <ngram occurrences="33" value="_x" /> + <ngram occurrences="32" value="_b" /> + <ngram occurrences="31" value="d_" /> + <ngram occurrences="31" value="_df" /> + <ngram occurrences="30" value="_h" /> + <ngram occurrences="29" value="lj" /> + <ngram occurrences="29" value="_p" /> + <ngram occurrences="28" value="_u_" /> + <ngram occurrences="27" value="q" /> + <ngram occurrences="27" value="jf" /> + <ngram occurrences="27" value="f_u" /> + <ngram occurrences="27" value="_s_" /> + <ngram occurrences="26" value="f_f" /> + <ngram occurrences="25" value="gf" /> + <ngram occurrences="25" value="_lj" /> + <ngram occurrences="25" value="_j" /> + <ngram occurrences="24" value="nf" /> + <ngram occurrences="24" value="kl" /> + <ngram occurrences="24" value="cf" /> + <ngram occurrences="24" value="_cf" /> + <ngram occurrences="23" value="_r" /> + <ngram occurrences="23" value="_kf" /> + <ngram occurrences="23" value="_df_" /> + <ngram occurrences="22" value="tf_" /> + <ngram occurrences="22" value="of" /> + <ngram occurrences="22" value="fo" /> + <ngram occurrences="22" value="f_sf" /> + <ngram occurrences="22" value="_o" /> + <ngram occurrences="21" value="z" /> + <ngram occurrences="21" value="fk" /> + <ngram occurrences="21" value="fg" /> + <ngram occurrences="21" value="fd" /> + <ngram occurrences="21" value="af" /> + <ngram occurrences="21" value="_kl" /> + <ngram occurrences="20" value="j_" /> + <ngram occurrences="20" value="_tf" /> + <ngram occurrences="19" value="w" /> + <ngram occurrences="19" value="ps" /> + <ngram occurrences="19" value="g_k" /> + <ngram occurrences="19" value="fl" /> + <ngram occurrences="18" value="y" /> + <ngram occurrences="18" value="i" /> + <ngram occurrences="18" value="gf_" /> + <ngram occurrences="18" value="g_f" /> + <ngram occurrences="18" value="f_f_" /> + <ngram occurrences="18" value="_l_" /> + <ngram occurrences="17" value="xf" /> + <ngram occurrences="17" value="sf_l" /> + <ngram occurrences="17" value="fj" /> + <ngram occurrences="17" value="f_u_" /> + <ngram occurrences="17" value="f_sf_" /> + <ngram occurrences="17" value="f_e" /> + <ngram occurrences="17" value="_t_" /> + <ngram occurrences="16" value="of_" /> + <ngram occurrences="16" value="fs" /> + <ngram occurrences="16" value="f_h" /> + <ngram occurrences="16" value="f_g" /> + <ngram occurrences="16" value="a_" /> + <ngram occurrences="16" value="_x_" /> + <ngram occurrences="15" value="lg_" /> + <ngram occurrences="15" value="km" /> + <ngram occurrences="15" value="g_l" /> + <ngram occurrences="15" value="fo_" /> + <ngram occurrences="15" value="f_n" /> + <ngram occurrences="15" value="ef" /> + <ngram occurrences="15" value="dg" /> + <ngram occurrences="14" value="lx" /> + <ngram occurrences="14" value="lt" /> + <ngram occurrences="14" value="if" /> + <ngram occurrences="14" value="fx" /> + <ngram occurrences="14" value="fu" /> + <ngram occurrences="14" value="f_t" /> + <ngram occurrences="14" value="f_k_" /> + <ngram occurrences="14" value="f_c" /> + <ngram occurrences="14" value="f_b" /> + <ngram occurrences="14" value="cg" /> + <ngram occurrences="14" value="af_" /> + <ngram occurrences="14" value="_o_" /> + <ngram occurrences="14" value="_lg" /> + <ngram occurrences="14" value="_d_" /> + <ngram occurrences="14" value="_cg" /> + <ngram occurrences="13" value="x_s" /> + <ngram occurrences="13" value="v" /> + <ngram occurrences="13" value="sf_s" /> + <ngram occurrences="13" value="ln" /> + <ngram occurrences="13" value="jf_" /> + <ngram occurrences="13" value="gb" /> + <ngram occurrences="13" value="fsf_" /> + <ngram occurrences="13" value="fsf" /> + <ngram occurrences="13" value="f_df" /> + <ngram occurrences="13" value="ep" /> + <ngram occurrences="13" value="_n_" /> + <ngram occurrences="13" value="_ep" /> + <ngram occurrences="13" value="_b_" /> + <ngram occurrences="13" value="_a_" /> + <ngram occurrences="12" value="ug" /> + <ngram occurrences="12" value="rg" /> + <ngram occurrences="12" value="psf_" /> + <ngram occurrences="12" value="psf" /> + <ngram occurrences="12" value="m_" /> + <ngram occurrences="12" value="klg_" /> + <ngram occurrences="12" value="klg" /> + <ngram occurrences="12" value="g_f_" /> + <ngram occurrences="12" value="fn_" /> + <ngram occurrences="12" value="f_x" /> + <ngram occurrences="12" value="f_s_" /> + <ngram occurrences="12" value="_klg_" /> + <ngram occurrences="12" value="_klg" /> + <ngram occurrences="12" value="_jf" /> + <ngram occurrences="12" value="_ef" /> + <ngram occurrences="11" value="ug_" /> + <ngram occurrences="11" value="to" /> + <ngram occurrences="11" value="sf_u" /> + <ngram occurrences="11" value="rf" /> + <ngram occurrences="11" value="ql" /> + <ngram occurrences="11" value="nl" /> + <ngram occurrences="11" value="ld" /> + <ngram occurrences="11" value="lb" /> + <ngram occurrences="11" value="kf_" /> + <ngram occurrences="11" value="hg" /> + <ngram occurrences="11" value="hf" /> + <ngram occurrences="11" value="gql" /> + <ngram occurrences="11" value="gq" /> + <ngram occurrences="11" value="g_s" /> + <ngram occurrences="11" value="g_g" /> + <ngram occurrences="11" value="fb" /> + <ngram occurrences="11" value="eps" /> + <ngram occurrences="11" value="dl" /> + <ngram occurrences="11" value="dgql" /> + <ngram occurrences="11" value="dgq" /> + <ngram occurrences="11" value="de" /> + <ngram occurrences="11" value="cg_" /> + <ngram occurrences="11" value="bf" /> + <ngram occurrences="11" value="_ug_" /> + <ngram occurrences="11" value="_ug" /> + <ngram occurrences="11" value="_rg" /> + <ngram occurrences="11" value="_rf" /> + <ngram occurrences="11" value="_eps" /> + <ngram occurrences="11" value="_cg_" /> + <ngram occurrences="11" value="_af" /> + <ngram occurrences="10" value="yf" /> + <ngram occurrences="10" value="x_sf_" /> + <ngram occurrences="10" value="x_sf" /> + <ngram occurrences="10" value="w_" /> + <ngram occurrences="10" value="tfj" /> + <ngram occurrences="10" value="sf_u_" /> + <ngram occurrences="10" value="nd" /> + <ngram occurrences="10" value="lr" /> + <ngram occurrences="10" value="l_c" /> + <ngram occurrences="10" value="kl_" /> + <ngram occurrences="10" value="kfn" /> + <ngram occurrences="10" value="k_t" /> + <ngram occurrences="10" value="gd" /> + <ngram occurrences="10" value="gb_" /> + <ngram occurrences="10" value="fx_" /> + <ngram occurrences="10" value="fp" /> + <ngram occurrences="10" value="f_r" /> + <ngram occurrences="10" value="f_p" /> + <ngram occurrences="10" value="f_l_" /> + <ngram occurrences="10" value="f_g_" /> + <ngram occurrences="10" value="f_df_" /> + <ngram occurrences="10" value="f_a" /> + <ngram occurrences="10" value="bg" /> + <ngram occurrences="10" value="_z" /> + <ngram occurrences="10" value="_tf_" /> + <ngram occurrences="10" value="_sf_u" /> + <ngram occurrences="10" value="_sf_l" /> + <ngram occurrences="10" value="_nf" /> + <ngram occurrences="10" value="_g_k" /> + <ngram occurrences="10" value="_f_l" /> + <ngram occurrences="9" value="sf_sf" /> + <ngram occurrences="9" value="sf_d" /> + <ngram occurrences="9" value="nl_" /> + <ngram occurrences="9" value="ls" /> + <ngram occurrences="9" value="g_kfn" /> + <ngram occurrences="9" value="g_kf" /> + <ngram occurrences="9" value="g_d" /> + <ngram occurrences="9" value="fk_" /> + <ngram occurrences="9" value="fg_" /> + <ngram occurrences="9" value="f_kl" /> + <ngram occurrences="9" value="epsf_" /> + <ngram occurrences="9" value="epsf" /> + <ngram occurrences="9" value="da" /> + <ngram occurrences="9" value="bf_" /> + <ngram occurrences="9" value="_lt" /> + <ngram occurrences="9" value="_ld" /> + <ngram occurrences="9" value="_lb" /> + <ngram occurrences="9" value="_kfn" /> + <ngram occurrences="9" value="_k_t" /> + <ngram occurrences="9" value="_hg" /> + <ngram occurrences="9" value="_g_kf" /> + <ngram occurrences="9" value="_epsf" /> + <ngram occurrences="9" value="_da" /> + <ngram occurrences="8" value="x_g_" /> + <ngram occurrences="8" value="x_g" /> + <ngram occurrences="8" value="ut" /> + <ngram occurrences="8" value="tfj_" /> + <ngram occurrences="8" value="sf_a" /> + <ngram occurrences="8" value="pg" /> + <ngram occurrences="8" value="nfo_" /> + <ngram occurrences="8" value="nfo" /> + <ngram occurrences="8" value="n_l" /> + <ngram occurrences="8" value="mn" /> + <ngram occurrences="8" value="lx_" /> + <ngram occurrences="8" value="k_tfj" /> + <ngram occurrences="8" value="k_tf" /> + <ngram occurrences="8" value="k_f" /> + <ngram occurrences="8" value="gs" /> + <ngram occurrences="8" value="g_a" /> + <ngram occurrences="8" value="fu_" /> + <ngram occurrences="8" value="fj_" /> + <ngram occurrences="8" value="f_j" /> + <ngram occurrences="8" value="f_d_" /> + <ngram occurrences="8" value="f_cf" /> + <ngram occurrences="8" value="em" /> + <ngram occurrences="8" value="df_f" /> + <ngram occurrences="8" value="df_d" /> + <ngram occurrences="8" value="cg_f_" /> + <ngram occurrences="8" value="cg_f" /> + <ngram occurrences="8" value="_y" /> + <ngram occurrences="8" value="_tfj" /> + <ngram occurrences="8" value="_sf_d" /> + <ngram occurrences="8" value="_kl_" /> + <ngram occurrences="8" value="_k_tf" /> + <ngram occurrences="8" value="_cg_f" /> + <ngram occurrences="7" value="z_" /> + <ngram occurrences="7" value="ul_" /> + <ngram occurrences="7" value="ul" /> + <ngram occurrences="7" value="t_l" /> + <ngram occurrences="7" value="sf_k" /> + <ngram occurrences="7" value="sf_df" /> + <ngram occurrences="7" value="s_d" /> + <ngram occurrences="7" value="rfn" /> + <ngram occurrences="7" value="r_" /> + <ngram occurrences="7" value="qm" /> + <ngram occurrences="7" value="lu" /> + <ngram occurrences="7" value="lk" /> + <ngram occurrences="7" value="l_s" /> + <ngram occurrences="7" value="l_l" /> + <ngram occurrences="7" value="l_k" /> + <ngram occurrences="7" value="jz" /> + <ngram occurrences="7" value="hgf_" /> + <ngram occurrences="7" value="hgf" /> + <ngram occurrences="7" value="h_" /> + <ngram occurrences="7" value="gg" /> + <ngram occurrences="7" value="g_u" /> + <ngram occurrences="7" value="g_t" /> + <ngram occurrences="7" value="fnl" /> + <ngram occurrences="7" value="fdf" /> + <ngram occurrences="7" value="fb_" /> + <ngram occurrences="7" value="f_lj" /> + <ngram occurrences="7" value="f_lg" /> + <ngram occurrences="7" value="f_klg" /> + <ngram occurrences="7" value="eg" /> + <ngram occurrences="7" value="e_" /> + <ngram occurrences="7" value="dt" /> + <ngram occurrences="7" value="bg_" /> + <ngram occurrences="7" value="b_a" /> + <ngram occurrences="7" value="_yf" /> + <ngram occurrences="7" value="_x_g_" /> + <ngram occurrences="7" value="_x_g" /> + <ngram occurrences="7" value="_w" /> + <ngram occurrences="7" value="_v" /> + <ngram occurrences="7" value="_rfn" /> + <ngram occurrences="7" value="_m" /> + <ngram occurrences="7" value="_lr" /> + <ngram occurrences="7" value="_ln" /> + <ngram occurrences="7" value="_hgf_" /> + <ngram occurrences="7" value="_hgf" /> + <ngram occurrences="7" value="_hf" /> + <ngram occurrences="7" value="_fk" /> + <ngram occurrences="7" value="_eg" /> + <ngram occurrences="7" value="_dg" /> + <ngram occurrences="7" value="_de" /> + <ngram occurrences="7" value="_af_" /> + <ngram occurrences="6" value="zj" /> + <ngram occurrences="6" value="xf_" /> + <ngram occurrences="6" value="wf" /> + <ngram occurrences="6" value="v_" /> + <ngram occurrences="6" value="ut_" /> + <ngram occurrences="6" value="uf" /> + <ngram occurrences="6" value="u_l" /> + <ngram occurrences="6" value="ts" /> + <ngram occurrences="6" value="tof" /> + <ngram occurrences="6" value="sf_lg" /> + <ngram occurrences="6" value="sf_l_" /> + <ngram occurrences="6" value="s_g_" /> + <ngram occurrences="6" value="s_g" /> + <ngram occurrences="6" value="s_f" /> + <ngram occurrences="6" value="rj" /> + <ngram occurrences="6" value="rgb" /> + <ngram occurrences="6" value="ql_" /> + <ngram occurrences="6" value="pk" /> + <ngram occurrences="6" value="pg_" /> + <ngram occurrences="6" value="o_l" /> + <ngram occurrences="6" value="nsf_" /> + <ngram occurrences="6" value="nsf" /> + <ngram occurrences="6" value="ns" /> + <ngram occurrences="6" value="ng_" /> + <ngram occurrences="6" value="ng" /> + <ngram occurrences="6" value="n_s" /> + <ngram occurrences="6" value="mtf" /> + <ngram occurrences="6" value="mt" /> + <ngram occurrences="6" value="mf_" /> + <ngram occurrences="6" value="mf" /> + <ngram occurrences="6" value="lrj" /> + <ngram occurrences="6" value="ljzj" /> + <ngram occurrences="6" value="ljz" /> + <ngram occurrences="6" value="ljjf" /> + <ngram occurrences="6" value="ljj" /> + <ngram occurrences="6" value="la" /> + <ngram occurrences="6" value="l_sf" /> + <ngram occurrences="6" value="l_f" /> + <ngram occurrences="6" value="l_d" /> + <ngram occurrences="6" value="l_cf" /> + <ngram occurrences="6" value="kmtf" /> + <ngram occurrences="6" value="kmt" /> + <ngram occurrences="6" value="kmn" /> + <ngram occurrences="6" value="kg" /> + <ngram occurrences="6" value="k_l" /> + <ngram occurrences="6" value="k_k" /> + <ngram occurrences="6" value="jzj" /> + <ngram occurrences="6" value="jl" /> + <ngram occurrences="6" value="jjf" /> + <ngram occurrences="6" value="jj" /> + <ngram occurrences="6" value="jfx" /> + <ngram occurrences="6" value="hf_" /> + <ngram occurrences="6" value="gsf_" /> + <ngram occurrences="6" value="gsf" /> + <ngram occurrences="6" value="gql_" /> + <ngram occurrences="6" value="go" /> + <ngram occurrences="6" value="gl" /> + <ngram occurrences="6" value="g_r" /> + <ngram occurrences="6" value="g_p" /> + <ngram occurrences="6" value="g_g_" /> + <ngram occurrences="6" value="g_c" /> + <ngram occurrences="6" value="fpg_" /> + <ngram occurrences="6" value="fpg" /> + <ngram occurrences="6" value="fnl_" /> +</ngrams> diff --git a/src/plugins/language/norwegian.klp b/src/plugins/language/norwegian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="894" value="_" /> + <ngram occurrences="586" value="e" /> + <ngram occurrences="395" value="n" /> + <ngram occurrences="304" value="r" /> + <ngram occurrences="271" value="t" /> + <ngram occurrences="249" value="a" /> + <ngram occurrences="219" value="s" /> + <ngram occurrences="200" value="o" /> + <ngram occurrences="177" value="l" /> + <ngram occurrences="175" value="i" /> + <ngram occurrences="172" value="n_" /> + <ngram occurrences="161" value="r_" /> + <ngram occurrences="154" value="g" /> + <ngram occurrences="150" value="k" /> + <ngram occurrences="145" value="h" /> + <ngram occurrences="138" value="en" /> + <ngram occurrences="138" value="e_" /> + <ngram occurrences="136" value="d" /> + <ngram occurrences="134" value="_h" /> + <ngram occurrences="132" value="m" /> + <ngram occurrences="116" value="er" /> + <ngram occurrences="113" value="t_" /> + <ngram occurrences="100" value="v" /> + <ngram occurrences="99" value="_s" /> + <ngram occurrences="94" value="er_" /> + <ngram occurrences="89" value="an" /> + <ngram occurrences="88" value="u" /> + <ngram occurrences="88" value="en_" /> + <ngram occurrences="80" value="ha" /> + <ngram occurrences="79" value="_ha" /> + <ngram occurrences="75" value="f" /> + <ngram occurrences="71" value="g_" /> + <ngram occurrences="66" value="de" /> + <ngram occurrences="66" value="_e" /> + <ngram occurrences="64" value="å" /> + <ngram occurrences="64" value="p" /> + <ngram occurrences="63" value="_d" /> + <ngram occurrences="60" value="_o" /> + <ngram occurrences="59" value="te" /> + <ngram occurrences="57" value="et" /> + <ngram occurrences="55" value="_f" /> + <ngram occurrences="54" value="or" /> + <ngram occurrences="52" value="ne" /> + <ngram occurrences="50" value="an_" /> + <ngram occurrences="49" value="et_" /> + <ngram occurrences="47" value="_i" /> + <ngram occurrences="46" value="han" /> + <ngram occurrences="46" value="_han" /> + <ngram occurrences="44" value="nn" /> + <ngram occurrences="43" value="å_" /> + <ngram occurrences="43" value="ke" /> + <ngram occurrences="43" value="_de" /> + <ngram occurrences="41" value="m_" /> + <ngram occurrences="41" value="han_" /> + <ngram occurrences="41" value="_han_" /> + <ngram occurrences="40" value="se" /> + <ngram occurrences="40" value="_v" /> + <ngram occurrences="40" value="_m" /> + <ngram occurrences="39" value="re" /> + <ngram occurrences="39" value="og" /> + <ngram occurrences="39" value="b" /> + <ngram occurrences="38" value="st" /> + <ngram occurrences="38" value="om" /> + <ngram occurrences="38" value="me" /> + <ngram occurrences="38" value="_og" /> + <ngram occurrences="37" value="og_" /> + <ngram occurrences="37" value="ar" /> + <ngram occurrences="37" value="_og_" /> + <ngram occurrences="36" value="un" /> + <ngram occurrences="35" value="_t" /> + <ngram occurrences="34" value="in" /> + <ngram occurrences="34" value="ge" /> + <ngram occurrences="34" value="fo" /> + <ngram occurrences="34" value="el" /> + <ngram occurrences="34" value="_k" /> + <ngram occurrences="33" value="for" /> + <ngram occurrences="32" value="ng" /> + <ngram occurrences="32" value="_a" /> + <ngram occurrences="31" value="j" /> + <ngram occurrences="30" value="ø" /> + <ngram occurrences="30" value="i_" /> + <ngram occurrences="30" value="_for" /> + <ngram occurrences="30" value="_fo" /> + <ngram occurrences="29" value="l_" /> + <ngram occurrences="29" value="il" /> + <ngram occurrences="29" value="_er_" /> + <ngram occurrences="29" value="_er" /> + <ngram occurrences="28" value="sk" /> + <ngram occurrences="28" value="om_" /> + <ngram occurrences="28" value="le" /> + <ngram occurrences="28" value="_b" /> + <ngram occurrences="27" value="r_h" /> + <ngram occurrences="27" value="_n" /> + <ngram occurrences="27" value="_g" /> + <ngram occurrences="26" value="ve" /> + <ngram occurrences="26" value="ne_" /> + <ngram occurrences="26" value="n_h" /> + <ngram occurrences="25" value="ti" /> + <ngram occurrences="25" value="kk" /> + <ngram occurrences="25" value="al" /> + <ngram occurrences="24" value="e_h" /> + <ngram occurrences="24" value="ar_" /> + <ngram occurrences="23" value="li" /> + <ngram occurrences="23" value="hu" /> + <ngram occurrences="23" value="es" /> + <ngram occurrences="23" value="_p" /> + <ngram occurrences="22" value="va" /> + <ngram occurrences="22" value="tt" /> + <ngram occurrences="22" value="te_" /> + <ngram occurrences="22" value="t_h" /> + <ngram occurrences="22" value="or_" /> + <ngram occurrences="22" value="nne" /> + <ngram occurrences="22" value="kke" /> + <ngram occurrences="22" value="det" /> + <ngram occurrences="21" value="y" /> + <ngram occurrences="21" value="rt" /> + <ngram occurrences="21" value="n_ha" /> + <ngram occurrences="21" value="is" /> + <ngram occurrences="21" value="det_" /> + <ngram occurrences="21" value="at" /> + <ngram occurrences="21" value="_se" /> + <ngram occurrences="21" value="_hu" /> + <ngram occurrences="20" value="so" /> + <ngram occurrences="20" value="r_s" /> + <ngram occurrences="20" value="ke_" /> + <ngram occurrences="20" value="for_" /> + <ngram occurrences="20" value="eg" /> + <ngram occurrences="20" value="d_" /> + <ngram occurrences="20" value="_me" /> + <ngram occurrences="19" value="vi" /> + <ngram occurrences="19" value="un_" /> + <ngram occurrences="19" value="hun_" /> + <ngram occurrences="19" value="hun" /> + <ngram occurrences="19" value="ed" /> + <ngram occurrences="19" value="_u" /> + <ngram occurrences="19" value="_so" /> + <ngram occurrences="19" value="_r" /> + <ngram occurrences="19" value="_l" /> + <ngram occurrences="19" value="_hun_" /> + <ngram occurrences="19" value="_hun" /> + <ngram occurrences="18" value="ør" /> + <ngram occurrences="18" value="pe" /> + <ngram occurrences="18" value="nge" /> + <ngram occurrences="18" value="n_s" /> + <ngram occurrences="18" value="ka" /> + <ngram occurrences="18" value="je" /> + <ngram occurrences="18" value="il_" /> + <ngram occurrences="18" value="he" /> + <ngram occurrences="18" value="de_" /> + <ngram occurrences="17" value="som" /> + <ngram occurrences="17" value="s_" /> + <ngram occurrences="17" value="ll" /> + <ngram occurrences="17" value="har_" /> + <ngram occurrences="17" value="har" /> + <ngram occurrences="17" value="_i_" /> + <ngram occurrences="17" value="_har_" /> + <ngram occurrences="17" value="_har" /> + <ngram occurrences="17" value="_for_" /> + <ngram occurrences="17" value="_det" /> + <ngram occurrences="16" value="til" /> + <ngram occurrences="16" value="ter" /> + <ngram occurrences="16" value="ste" /> + <ngram occurrences="16" value="som_" /> + <ngram occurrences="16" value="r_d" /> + <ngram occurrences="16" value="la" /> + <ngram occurrences="16" value="ig" /> + <ngram occurrences="16" value="g_s" /> + <ngram occurrences="16" value="er_h" /> + <ngram occurrences="16" value="e_s" /> + <ngram occurrences="16" value="_ti" /> + <ngram occurrences="16" value="_som_" /> + <ngram occurrences="16" value="_som" /> + <ngram occurrences="16" value="_en" /> + <ngram occurrences="16" value="_det_" /> + <ngram occurrences="15" value="ns" /> + <ngram occurrences="15" value="ik" /> + <ngram occurrences="15" value="eg_" /> + <ngram occurrences="15" value="am" /> + <ngram occurrences="15" value="_å" /> + <ngram occurrences="15" value="_til" /> + <ngram occurrences="14" value="v_" /> + <ngram occurrences="14" value="til_" /> + <ngram occurrences="14" value="ten" /> + <ngram occurrences="14" value="ta" /> + <ngram occurrences="14" value="t_ha" /> + <ngram occurrences="14" value="t_e" /> + <ngram occurrences="14" value="på_" /> + <ngram occurrences="14" value="på" /> + <ngram occurrences="14" value="nt" /> + <ngram occurrences="14" value="nd" /> + <ngram occurrences="14" value="n_m" /> + <ngram occurrences="14" value="kke_" /> + <ngram occurrences="14" value="ikk" /> + <ngram occurrences="14" value="gen" /> + <ngram occurrences="14" value="er_s" /> + <ngram occurrences="14" value="enn" /> + <ngram occurrences="14" value="av" /> + <ngram occurrences="14" value="a_" /> + <ngram occurrences="14" value="_på_" /> + <ngram occurrences="14" value="_på" /> + <ngram occurrences="13" value="år" /> + <ngram occurrences="13" value="ut" /> + <ngram occurrences="13" value="re_" /> + <ngram occurrences="13" value="on" /> + <ngram occurrences="13" value="no" /> + <ngram occurrences="13" value="n_e" /> + <ngram occurrences="13" value="mme" /> + <ngram occurrences="13" value="mm" /> + <ngram occurrences="13" value="ene" /> + <ngram occurrences="13" value="en_h" /> + <ngram occurrences="13" value="_til_" /> + <ngram occurrences="13" value="_ka" /> + <ngram occurrences="13" value="_in" /> + <ngram occurrences="13" value="_he" /> + <ngram occurrences="12" value="år_" /> + <ngram occurrences="12" value="r_ha" /> + <ngram occurrences="12" value="r_f" /> + <ngram occurrences="12" value="r_de" /> + <ngram occurrences="12" value="n_han" /> + <ngram occurrences="12" value="lo" /> + <ngram occurrences="12" value="lig" /> + <ngram occurrences="12" value="ko" /> + <ngram occurrences="12" value="ing" /> + <ngram occurrences="12" value="ikke_" /> + <ngram occurrences="12" value="ikke" /> + <ngram occurrences="12" value="hv" /> + <ngram occurrences="12" value="hen" /> + <ngram occurrences="12" value="enne" /> + <ngram occurrences="12" value="em" /> + <ngram occurrences="12" value="e_ha" /> + <ngram occurrences="12" value="den_" /> + <ngram occurrences="12" value="den" /> + <ngram occurrences="12" value="_vi" /> + <ngram occurrences="12" value="_ve" /> + <ngram occurrences="12" value="_ikke" /> + <ngram occurrences="12" value="_ikk" /> + <ngram occurrences="12" value="_ik" /> + <ngram occurrences="12" value="_av" /> + <ngram occurrences="11" value="tte" /> + <ngram occurrences="11" value="tr" /> + <ngram occurrences="11" value="ten_" /> + <ngram occurrences="11" value="ste_" /> + <ngram occurrences="11" value="r_i" /> + <ngram occurrences="11" value="r_e" /> + <ngram occurrences="11" value="pen_" /> + <ngram occurrences="11" value="pen" /> + <ngram occurrences="11" value="nne_" /> + <ngram occurrences="11" value="ni" /> + <ngram occurrences="11" value="n_v" /> + <ngram occurrences="11" value="n_t" /> + <ngram occurrences="11" value="inn" /> + <ngram occurrences="11" value="ham_" /> + <ngram occurrences="11" value="ham" /> + <ngram occurrences="11" value="ei" /> + <ngram occurrences="11" value="ed_" /> + <ngram occurrences="11" value="e_f" /> + <ngram occurrences="11" value="am_" /> + <ngram occurrences="11" value="_st" /> + <ngram occurrences="11" value="_no" /> + <ngram occurrences="11" value="_ham_" /> + <ngram occurrences="11" value="_ham" /> + <ngram occurrences="11" value="_den_" /> + <ngram occurrences="11" value="_den" /> + <ngram occurrences="11" value="_at" /> + <ngram occurrences="10" value="ær" /> + <ngram occurrences="10" value="æ" /> + <ngram occurrences="10" value="unn" /> + <ngram occurrences="10" value="t_s" /> + <ngram occurrences="10" value="t_han" /> + <ngram occurrences="10" value="så_" /> + <ngram occurrences="10" value="så" /> + <ngram occurrences="10" value="n_k" /> + <ngram occurrences="10" value="ma" /> + <ngram occurrences="10" value="k_" /> + <ngram occurrences="10" value="it" /> + <ngram occurrences="10" value="gen_" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="be" /> + <ngram occurrences="10" value="av_" /> + <ngram occurrences="10" value="ans" /> + <ngram occurrences="10" value="_å_" /> + <ngram occurrences="10" value="_un" /> + <ngram occurrences="10" value="_hv" /> + <ngram occurrences="10" value="_hen" /> + <ngram occurrences="9" value="tt_" /> + <ngram occurrences="9" value="sv" /> + <ngram occurrences="9" value="sp" /> + <ngram occurrences="9" value="ser" /> + <ngram occurrences="9" value="seg_" /> + <ngram occurrences="9" value="seg" /> + <ngram occurrences="9" value="rs" /> + <ngram occurrences="9" value="ra" /> + <ngram occurrences="9" value="r_han" /> + <ngram occurrences="9" value="oe" /> + <ngram occurrences="9" value="nni" /> + <ngram occurrences="9" value="ng_" /> + <ngram occurrences="9" value="n_o" /> + <ngram occurrences="9" value="n_me" /> + <ngram occurrences="9" value="men" /> + <ngram occurrences="9" value="med" /> + <ngram occurrences="9" value="lt" /> + <ngram occurrences="9" value="ls" /> + <ngram occurrences="9" value="le_" /> + <ngram occurrences="9" value="ld" /> + <ngram occurrences="9" value="kan" /> + <ngram occurrences="9" value="ig_" /> + <ngram occurrences="9" value="est" /> + <ngram occurrences="9" value="ere" /> + <ngram occurrences="9" value="eng" /> + <ngram occurrences="9" value="en_ha" /> + <ngram occurrences="9" value="els" /> + <ngram occurrences="9" value="e_d" /> + <ngram occurrences="9" value="der" /> + <ngram occurrences="9" value="da" /> + <ngram occurrences="9" value="at_" /> + <ngram occurrences="9" value="ang" /> + <ngram occurrences="9" value="ak" /> + <ngram occurrences="9" value="_va" /> + <ngram occurrences="9" value="_så_" /> + <ngram occurrences="9" value="_så" /> + <ngram occurrences="9" value="_sk" /> + <ngram occurrences="9" value="_seg_" /> + <ngram occurrences="9" value="_seg" /> + <ngram occurrences="9" value="_om_" /> + <ngram occurrences="9" value="_om" /> + <ngram occurrences="9" value="_kan" /> + <ngram occurrences="9" value="_et" /> + <ngram occurrences="9" value="_en_" /> + <ngram occurrences="9" value="_du" /> + <ngram occurrences="9" value="_av_" /> + <ngram occurrences="9" value="_at_" /> + <ngram occurrences="8" value="vo" /> + <ngram occurrences="8" value="unni" /> + <ngram occurrences="8" value="ter_" /> + <ngram occurrences="8" value="t_o" /> + <ngram occurrences="8" value="t_er_" /> + <ngram occurrences="8" value="t_er" /> + <ngram occurrences="8" value="t_a" /> + <ngram occurrences="8" value="ss" /> + <ngram occurrences="8" value="ske" /> + <ngram occurrences="8" value="ser_" /> + <ngram occurrences="8" value="sa" /> + <ngram occurrences="8" value="ru" /> + <ngram occurrences="8" value="rt_" /> + <ngram occurrences="8" value="ro" /> + <ngram occurrences="8" value="rd" /> + <ngram occurrences="8" value="r_o" /> + <ngram occurrences="8" value="pp" /> + <ngram occurrences="8" value="ord" /> + <ngram occurrences="8" value="ol" /> + <ngram occurrences="8" value="og_s" /> + <ngram occurrences="8" value="nn_" /> + <ngram occurrences="8" value="ngen" /> + <ngram occurrences="8" value="n_i" /> + <ngram occurrences="8" value="n_har" /> + <ngram occurrences="8" value="men_" /> + <ngram occurrences="8" value="med_" /> + <ngram occurrences="8" value="lle" /> + <ngram occurrences="8" value="kt" /> + <ngram occurrences="8" value="kan_" /> + <ngram occurrences="8" value="inge" /> + <ngram occurrences="8" value="ie" /> + <ngram occurrences="8" value="henne" /> + <ngram occurrences="8" value="henn" /> + <ngram occurrences="8" value="gan" /> + <ngram occurrences="8" value="ga" /> + <ngram occurrences="8" value="et_e" /> + <ngram occurrences="8" value="er_i" /> + <ngram occurrences="8" value="enne_" /> + <ngram occurrences="8" value="ene_" /> + <ngram occurrences="8" value="en_s" /> + <ngram occurrences="8" value="en_m" /> + <ngram occurrences="8" value="e_m" /> + <ngram occurrences="8" value="e_e" /> + <ngram occurrences="8" value="_unni" /> + <ngram occurrences="8" value="_unn" /> + <ngram occurrences="8" value="_og_s" /> + <ngram occurrences="8" value="_med_" /> + <ngram occurrences="8" value="_med" /> + <ngram occurrences="8" value="_kan_" /> + <ngram occurrences="8" value="_henn" /> + <ngram occurrences="8" value="_de_" /> + <ngram occurrences="8" value="_be" /> + <ngram occurrences="7" value="ør_" /> + <ngram occurrences="7" value="å_h" /> + <ngram occurrences="7" value="var" /> + <ngram occurrences="7" value="t_v" /> + <ngram occurrences="7" value="sl" /> + <ngram occurrences="7" value="si" /> + <ngram occurrences="7" value="sen" /> + <ngram occurrences="7" value="ri" /> + <ngram occurrences="7" value="r_se" /> + <ngram occurrences="7" value="r_a" /> + <ngram occurrences="7" value="ort" /> + <ngram occurrences="7" value="o_" /> + <ngram occurrences="7" value="nå" /> + <ngram occurrences="7" value="noe" /> + <ngram occurrences="7" value="ner" /> + <ngram occurrences="7" value="ne_h" /> + <ngram occurrences="7" value="nde" /> +</ngrams> diff --git a/src/plugins/language/persian.klp b/src/plugins/language/persian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="871" value="_" /> + <ngram occurrences="145" value="þ" /> + <ngram occurrences="144" value="õ" /> + <ngram occurrences="131" value="ø" /> + <ngram occurrences="109" value="õ_" /> + <ngram occurrences="97" value="ù" /> + <ngram occurrences="89" value="þ_" /> + <ngram occurrences="87" value="ø_" /> + <ngram occurrences="85" value="_ø" /> + <ngram occurrences="83" value="¨" /> + <ngram occurrences="81" value="ö" /> + <ngram occurrences="81" value="_ù" /> + <ngram occurrences="79" value="_ö" /> + <ngram occurrences="71" value="_þ" /> + <ngram occurrences="68" value="ü" /> + <ngram occurrences="66" value="_ø_" /> + <ngram occurrences="63" value="î" /> + <ngram occurrences="61" value="_¨" /> + <ngram occurrences="60" value="ù_" /> + <ngram occurrences="60" value="_õ" /> + <ngram occurrences="58" value="_ü" /> + <ngram occurrences="55" value="¨_" /> + <ngram occurrences="53" value="ª" /> + <ngram occurrences="53" value="_ù_" /> + <ngram occurrences="50" value="ý" /> + <ngram occurrences="50" value="_ý" /> + <ngram occurrences="49" value="î_" /> + <ngram occurrences="48" value="ý_" /> + <ngram occurrences="48" value="_ý_" /> + <ngram occurrences="48" value="_õ_" /> + <ngram occurrences="47" value="ó" /> + <ngram occurrences="46" value="û" /> + <ngram occurrences="46" value="ö_" /> + <ngram occurrences="45" value="ê" /> + <ngram occurrences="44" value="_¨_" /> + <ngram occurrences="44" value="_þ_" /> + <ngram occurrences="44" value="_ö_" /> + <ngram occurrences="36" value="ü_" /> + <ngram occurrences="36" value="_ê" /> + <ngram occurrences="34" value="û_" /> + <ngram occurrences="32" value="ò" /> + <ngram occurrences="32" value="_û" /> + <ngram occurrences="31" value="ú" /> + <ngram occurrences="31" value="ñ" /> + <ngram occurrences="31" value="_ü_" /> + <ngram occurrences="31" value="_î" /> + <ngram occurrences="29" value="ð" /> + <ngram occurrences="29" value="ê_" /> + <ngram occurrences="29" value="ª_" /> + <ngram occurrences="28" value="_ñ" /> + <ngram occurrences="27" value="ô" /> + <ngram occurrences="27" value="y" /> + <ngram occurrences="27" value="s" /> + <ngram occurrences="27" value="_ª" /> + <ngram occurrences="26" value="_ú" /> + <ngram occurrences="26" value="_ê_" /> + <ngram occurrences="24" value="ð_" /> + <ngram occurrences="22" value="þõ" /> + <ngram occurrences="22" value="ñ_" /> + <ngram occurrences="22" value="ì" /> + <ngram occurrences="22" value="_î_" /> + <ngram occurrences="22" value="_s" /> + <ngram occurrences="21" value="_û_" /> + <ngram occurrences="21" value="_ô" /> + <ngram occurrences="20" value="ä" /> + <ngram occurrences="20" value="_ª_" /> + <ngram occurrences="19" value="_ñ_" /> + <ngram occurrences="18" value="þõ_" /> + <ngram occurrences="18" value="öþ" /> + <ngram occurrences="18" value="y_" /> + <ngram occurrences="18" value="_öþ" /> + <ngram occurrences="17" value="õ_ø" /> + <ngram occurrences="17" value="ó_" /> + <ngram occurrences="17" value="ò_" /> + <ngram occurrences="17" value="ì_" /> + <ngram occurrences="16" value="þó" /> + <ngram occurrences="16" value="öþ_" /> + <ngram occurrences="16" value="ä_" /> + <ngram occurrences="16" value="s_" /> + <ngram occurrences="16" value="_öþ_" /> + <ngram occurrences="15" value="üõ" /> + <ngram occurrences="15" value="ú_" /> + <ngram occurrences="15" value="ø_ù" /> + <ngram occurrences="15" value="ö_þ" /> + <ngram occurrences="15" value="ã" /> + <ngram occurrences="15" value="_ö_þ" /> + <ngram occurrences="15" value="_ò" /> + <ngram occurrences="14" value="ý_û" /> + <ngram occurrences="14" value="ùî_" /> + <ngram occurrences="14" value="ùî" /> + <ngram occurrences="14" value="öø" /> + <ngram occurrences="14" value="_ý_û" /> + <ngram occurrences="14" value="_ú_" /> + <ngram occurrences="14" value="_öø" /> + <ngram occurrences="13" value="þ_ø" /> + <ngram occurrences="13" value="þ_ö" /> + <ngram occurrences="13" value="õ_þ" /> + <ngram occurrences="13" value="õ_ø_" /> + <ngram occurrences="13" value="_ùî_" /> + <ngram occurrences="13" value="_ùî" /> + <ngram occurrences="13" value="_s_" /> + <ngram occurrences="12" value="þ_ø_" /> + <ngram occurrences="12" value="ø_ù_" /> + <ngram occurrences="12" value="óþ" /> + <ngram occurrences="12" value="_ø_ù" /> + <ngram occurrences="12" value="_ð" /> + <ngram occurrences="11" value="þ_ü" /> + <ngram occurrences="11" value="ô_" /> + <ngram occurrences="11" value="_üõ" /> + <ngram occurrences="11" value="_ì_" /> + <ngram occurrences="11" value="_ì" /> + <ngram occurrences="10" value="þóþõ_" /> + <ngram occurrences="10" value="þóþõ" /> + <ngram occurrences="10" value="þóþ" /> + <ngram occurrences="10" value="øª" /> + <ngram occurrences="10" value="ø_ü" /> + <ngram occurrences="10" value="ö_þ_" /> + <ngram occurrences="10" value="õ_ü" /> + <ngram occurrences="10" value="õ_ö" /> + <ngram occurrences="10" value="óþõ_" /> + <ngram occurrences="10" value="óþõ" /> + <ngram occurrences="10" value="ñ_¨" /> + <ngram occurrences="10" value="_þõ" /> + <ngram occurrences="10" value="_øª" /> + <ngram occurrences="10" value="_ø_ü" /> + <ngram occurrences="10" value="_ö_þ_" /> + <ngram occurrences="10" value="_õ_ø" /> + <ngram occurrences="10" value="_ò_" /> + <ngram occurrences="10" value="_y" /> + <ngram occurrences="9" value="¨_ù" /> + <ngram occurrences="9" value="ü_õ" /> + <ngram occurrences="9" value="øþ" /> + <ngram occurrences="9" value="øõ" /> + <ngram occurrences="9" value="ã_" /> + <ngram occurrences="9" value="ªî_" /> + <ngram occurrences="9" value="ªî" /> + <ngram occurrences="9" value="_ø_ù_" /> + <ngram occurrences="9" value="_ð_" /> + <ngram occurrences="9" value="_ä" /> + <ngram occurrences="8" value="¨õ" /> + <ngram occurrences="8" value="þ_ö_" /> + <ngram occurrences="8" value="ûù" /> + <ngram occurrences="8" value="øþóþõ" /> + <ngram occurrences="8" value="øþóþ" /> + <ngram occurrences="8" value="øþó" /> + <ngram occurrences="8" value="øõ_" /> + <ngram occurrences="8" value="öøþóþ" /> + <ngram occurrences="8" value="öøþó" /> + <ngram occurrences="8" value="öøþ" /> + <ngram occurrences="8" value="_¨_ù" /> + <ngram occurrences="8" value="_þõ_" /> + <ngram occurrences="8" value="_þ_ü" /> + <ngram occurrences="8" value="_ü_õ" /> + <ngram occurrences="8" value="_öøþó" /> + <ngram occurrences="8" value="_öøþ" /> + <ngram occurrences="8" value="_õ_ø_" /> + <ngram occurrences="8" value="_ô_" /> + <ngram occurrences="8" value="_ñ_¨" /> + <ngram occurrences="8" value="_ã" /> + <ngram occurrences="8" value="_y_" /> + <ngram occurrences="7" value="þ_þ" /> + <ngram occurrences="7" value="þ_ü_" /> + <ngram occurrences="7" value="ý_ú" /> + <ngram occurrences="7" value="üõ_" /> + <ngram occurrences="7" value="üð_" /> + <ngram occurrences="7" value="üð" /> + <ngram occurrences="7" value="ù_þ" /> + <ngram occurrences="7" value="ù_ø" /> + <ngram occurrences="7" value="ù_õ" /> + <ngram occurrences="7" value="ø_¨" /> + <ngram occurrences="7" value="ø_ö" /> + <ngram occurrences="7" value="öþ_ø_" /> + <ngram occurrences="7" value="öþ_ø" /> + <ngram occurrences="7" value="ö_¨_" /> + <ngram occurrences="7" value="ö_¨" /> + <ngram occurrences="7" value="õ_þ_" /> + <ngram occurrences="7" value="õ_ü_" /> + <ngram occurrences="7" value="õ_ù_" /> + <ngram occurrences="7" value="õ_ù" /> + <ngram occurrences="7" value="ò_öøþ" /> + <ngram occurrences="7" value="ò_öø" /> + <ngram occurrences="7" value="ò_ö" /> + <ngram occurrences="7" value="à" /> + <ngram occurrences="7" value="yõ_" /> + <ngram occurrences="7" value="yõ" /> + <ngram occurrences="7" value="s_ò_" /> + <ngram occurrences="7" value="s_ò" /> + <ngram occurrences="7" value="f_" /> + <ngram occurrences="7" value="f" /> + <ngram occurrences="7" value="_ý_ú" /> + <ngram occurrences="7" value="_üð_" /> + <ngram occurrences="7" value="_üð" /> + <ngram occurrences="7" value="_ûù" /> + <ngram occurrences="7" value="_ù_õ" /> + <ngram occurrences="7" value="_öþ_ø" /> + <ngram occurrences="7" value="_ó" /> + <ngram occurrences="7" value="_ò_öø" /> + <ngram occurrences="7" value="_ò_ö" /> + <ngram occurrences="7" value="_f_" /> + <ngram occurrences="7" value="_f" /> + <ngram occurrences="6" value="¨_ý_" /> + <ngram occurrences="6" value="¨_ý" /> + <ngram occurrences="6" value="¨_ö" /> + <ngram occurrences="6" value="ý_ûù" /> + <ngram occurrences="6" value="ü_¨" /> + <ngram occurrences="6" value="ü_õ_" /> + <ngram occurrences="6" value="ûù_" /> + <ngram occurrences="6" value="û_ø_" /> + <ngram occurrences="6" value="û_ø" /> + <ngram occurrences="6" value="ù_þ_" /> + <ngram occurrences="6" value="øªî_" /> + <ngram occurrences="6" value="øªî" /> + <ngram occurrences="6" value="ø_¨_" /> + <ngram occurrences="6" value="ø_ü_" /> + <ngram occurrences="6" value="ø_ö_" /> + <ngram occurrences="6" value="ø_õ" /> + <ngram occurrences="6" value="õó" /> + <ngram occurrences="6" value="õª" /> + <ngram occurrences="6" value="õ_ô" /> + <ngram occurrences="6" value="ôþ" /> + <ngram occurrences="6" value="ô_õ_" /> + <ngram occurrences="6" value="ô_õ" /> + <ngram occurrences="6" value="ó_ù" /> + <ngram occurrences="6" value="ñ_¨_" /> + <ngram occurrences="6" value="êð" /> + <ngram occurrences="6" value="s_ò_ö" /> + <ngram occurrences="6" value="_¨_ö" /> + <ngram occurrences="6" value="_ý_ûù" /> + <ngram occurrences="6" value="_ü_¨" /> + <ngram occurrences="6" value="_ü_õ_" /> + <ngram occurrences="6" value="_ù_þ" /> + <ngram occurrences="6" value="_øªî_" /> + <ngram occurrences="6" value="_øªî" /> + <ngram occurrences="6" value="_ø_¨_" /> + <ngram occurrences="6" value="_ø_¨" /> + <ngram occurrences="6" value="_ø_ü_" /> + <ngram occurrences="6" value="_ø_ö" /> + <ngram occurrences="6" value="_ö_¨_" /> + <ngram occurrences="6" value="_ö_¨" /> + <ngram occurrences="6" value="_õ_ü" /> + <ngram occurrences="6" value="_êð" /> + <ngram occurrences="6" value="_ä_" /> + <ngram occurrences="6" value="_ã_" /> + <ngram occurrences="6" value="_s_ò_" /> + <ngram occurrences="6" value="_s_ò" /> + <ngram occurrences="5" value="¨ø" /> + <ngram occurrences="5" value="¨õ_" /> + <ngram occurrences="5" value="¨_ù_" /> + <ngram occurrences="5" value="¨_ö_" /> + <ngram occurrences="5" value="¨_ñ" /> + <ngram occurrences="5" value="þ_¨" /> + <ngram occurrences="5" value="þ_û_" /> + <ngram occurrences="5" value="þ_û" /> + <ngram occurrences="5" value="þ_ù" /> + <ngram occurrences="5" value="þ_õ" /> + <ngram occurrences="5" value="ý_þ" /> + <ngram occurrences="5" value="ý_û_" /> + <ngram occurrences="5" value="ü_ª" /> + <ngram occurrences="5" value="úª" /> + <ngram occurrences="5" value="ùþ" /> + <ngram occurrences="5" value="ùõ" /> + <ngram occurrences="5" value="ù_ø_" /> + <ngram occurrences="5" value="ø_ý_" /> + <ngram occurrences="5" value="ø_ý" /> + <ngram occurrences="5" value="ø_õ_" /> + <ngram occurrences="5" value="ø_ê_" /> + <ngram occurrences="5" value="ø_ê" /> + <ngram occurrences="5" value="ö_ø_" /> + <ngram occurrences="5" value="ö_ø" /> + <ngram occurrences="5" value="õû" /> + <ngram occurrences="5" value="õ_ý_" /> + <ngram occurrences="5" value="õ_ý" /> + <ngram occurrences="5" value="õ_ø_ù" /> + <ngram occurrences="5" value="ôò" /> + <ngram occurrences="5" value="ñþ" /> + <ngram occurrences="5" value="î_ý_" /> + <ngram occurrences="5" value="î_ý" /> + <ngram occurrences="5" value="î_ü" /> + <ngram occurrences="5" value="î_ù" /> + <ngram occurrences="5" value="î_ö" /> + <ngram occurrences="5" value="î_ª" /> + <ngram occurrences="5" value="êð_" /> + <ngram occurrences="5" value="è" /> + <ngram occurrences="5" value="y_ö" /> + <ngram occurrences="5" value="_¨_ö_" /> + <ngram occurrences="5" value="_¨_ñ" /> + <ngram occurrences="5" value="_þó" /> + <ngram occurrences="5" value="_þ_ö" /> + <ngram occurrences="5" value="_ý_þ" /> + <ngram occurrences="5" value="_ý_û_" /> + <ngram occurrences="5" value="_ü_ª" /> + <ngram occurrences="5" value="_ûù_" /> + <ngram occurrences="5" value="_úª" /> + <ngram occurrences="5" value="_ù_þ_" /> + <ngram occurrences="5" value="_ø_ö_" /> + <ngram occurrences="5" value="_ø_ê_" /> + <ngram occurrences="5" value="_ø_ê" /> + <ngram occurrences="5" value="_ö_ø_" /> + <ngram occurrences="5" value="_ö_ø" /> + <ngram occurrences="5" value="_õ_ü_" /> + <ngram occurrences="5" value="_õ_ù_" /> + <ngram occurrences="5" value="_õ_ù" /> + <ngram occurrences="5" value="_ô_õ_" /> + <ngram occurrences="5" value="_ô_õ" /> + <ngram occurrences="5" value="_ó_" /> + <ngram occurrences="5" value="_ñþ" /> + <ngram occurrences="5" value="_êð_" /> + <ngram occurrences="4" value="¨_ø_" /> + <ngram occurrences="4" value="¨_ø" /> + <ngram occurrences="4" value="¨_ñ_" /> + <ngram occurrences="4" value="¨_ê" /> + <ngram occurrences="4" value="þ¨_" /> + <ngram occurrences="4" value="þ¨" /> + <ngram occurrences="4" value="þõ_f_" /> + <ngram occurrences="4" value="þõ_f" /> + <ngram occurrences="4" value="þ_¨_" /> + <ngram occurrences="4" value="þ_þ_" /> + <ngram occurrences="4" value="þ_ý_" /> + <ngram occurrences="4" value="þ_ý" /> + <ngram occurrences="4" value="þ_ü_¨" /> + <ngram occurrences="4" value="þ_ø_ê" /> + <ngram occurrences="4" value="þ_ö_þ" /> + <ngram occurrences="4" value="þ_ê" /> + <ngram occurrences="4" value="þ_ª" /> + <ngram occurrences="4" value="ý_ûù_" /> + <ngram occurrences="4" value="ý_ú_" /> + <ngram occurrences="4" value="ý_ø" /> + <ngram occurrences="4" value="ü_¨_" /> + <ngram occurrences="4" value="ü_ø" /> + <ngram occurrences="4" value="û_ö" /> + <ngram occurrences="4" value="û_ê_" /> + <ngram occurrences="4" value="û_ê" /> + <ngram occurrences="4" value="ùõ_" /> + <ngram occurrences="4" value="ù_¨" /> + <ngram occurrences="4" value="ù_ü" /> + <ngram occurrences="4" value="ù_ö_" /> + <ngram occurrences="4" value="ù_ö" /> + <ngram occurrences="4" value="ù_õ_" /> + <ngram occurrences="4" value="ù_ð" /> + <ngram occurrences="4" value="ù_ª" /> + <ngram occurrences="4" value="øó" /> + <ngram occurrences="4" value="ø_s_" /> + <ngram occurrences="4" value="ø_s" /> + <ngram occurrences="4" value="öø_" /> + <ngram occurrences="4" value="ö_ú_" /> + <ngram occurrences="4" value="ö_ú" /> + <ngram occurrences="4" value="ö_õ" /> + <ngram occurrences="4" value="õû_" /> + <ngram occurrences="4" value="õò" /> + <ngram occurrences="4" value="õª_" /> + <ngram occurrences="4" value="õ_ú" /> + <ngram occurrences="4" value="õ_öþ_" /> + <ngram occurrences="4" value="õ_öþ" /> + <ngram occurrences="4" value="õ_ö_" /> + <ngram occurrences="4" value="õ_f_" /> + <ngram occurrences="4" value="õ_f" /> + <ngram occurrences="4" value="ôþ_" /> + <ngram occurrences="4" value="ôòä_" /> + <ngram occurrences="4" value="ôòä" /> + <ngram occurrences="4" value="óþõ_f" /> + <ngram occurrences="4" value="óø" /> + <ngram occurrences="4" value="óõ" /> + <ngram occurrences="4" value="ó_ù_" /> + <ngram occurrences="4" value="ò¨" /> + <ngram occurrences="4" value="òä_" /> + <ngram occurrences="4" value="òä" /> + <ngram occurrences="4" value="ð_û_" /> + <ngram occurrences="4" value="ð_û" /> + <ngram occurrences="4" value="î_þ" /> + <ngram occurrences="4" value="î_ª_" /> + <ngram occurrences="4" value="ì_ü" /> + <ngram occurrences="4" value="ë" /> + <ngram occurrences="4" value="ê_ý_" /> + <ngram occurrences="4" value="ê_ý" /> + <ngram occurrences="4" value="ê_ü" /> + <ngram occurrences="4" value="ê_ù" /> + <ngram occurrences="4" value="é" /> + <ngram occurrences="4" value="è_" /> + <ngram occurrences="4" value="á" /> + <ngram occurrences="4" value="ª_û_" /> + <ngram occurrences="4" value="ª_û" /> + <ngram occurrences="4" value="sô" /> + <ngram occurrences="4" value="_¨õ" /> + <ngram occurrences="4" value="_¨_ý_" /> + <ngram occurrences="4" value="_¨_ý" /> + <ngram occurrences="4" value="_¨_ù_" /> + <ngram occurrences="4" value="_¨_ñ_" /> + <ngram occurrences="4" value="_¨_ê" /> + <ngram occurrences="4" value="_þ_ü_" /> + <ngram occurrences="4" value="_þ_ù" /> + <ngram occurrences="4" value="_þ_ê" /> + <ngram occurrences="4" value="_ý_ú_" /> + <ngram occurrences="4" value="_ý_ø" /> + <ngram occurrences="4" value="_ü_¨_" /> + <ngram occurrences="4" value="_û_ö" /> + <ngram occurrences="4" value="_û_ê_" /> + <ngram occurrences="4" value="_û_ê" /> + <ngram occurrences="4" value="_ù_¨" /> + <ngram occurrences="4" value="_ù_ø" /> + <ngram occurrences="4" value="_ù_õ_" /> +</ngrams> diff --git a/src/plugins/language/polish.klp b/src/plugins/language/polish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="718" value="_" /> + <ngram occurrences="340" value="e" /> + <ngram occurrences="328" value="a" /> + <ngram occurrences="326" value="i" /> + <ngram occurrences="283" value="o" /> + <ngram occurrences="234" value="n" /> + <ngram occurrences="222" value="z" /> + <ngram occurrences="174" value="w" /> + <ngram occurrences="173" value="r" /> + <ngram occurrences="155" value="s" /> + <ngram occurrences="153" value="y" /> + <ngram occurrences="147" value="t" /> + <ngram occurrences="141" value="c" /> + <ngram occurrences="131" value="p" /> + <ngram occurrences="131" value="k" /> + <ngram occurrences="131" value="d" /> + <ngram occurrences="109" value="ie" /> + <ngram occurrences="106" value="m" /> + <ngram occurrences="99" value="u" /> + <ngram occurrences="97" value="_p" /> + <ngram occurrences="94" value="ni" /> + <ngram occurrences="92" value="o_" /> + <ngram occurrences="92" value="l" /> + <ngram occurrences="92" value="j" /> + <ngram occurrences="91" value="a_" /> + <ngram occurrences="88" value="e_" /> + <ngram occurrences="75" value="³" /> + <ngram occurrences="74" value="i_" /> + <ngram occurrences="72" value="g" /> + <ngram occurrences="67" value="_w" /> + <ngram occurrences="64" value="b" /> + <ngram occurrences="62" value="_n" /> + <ngram occurrences="56" value="y_" /> + <ngram occurrences="51" value="_s" /> + <ngram occurrences="49" value="ze" /> + <ngram occurrences="47" value="_d" /> + <ngram occurrences="45" value="ê" /> + <ngram occurrences="45" value="_z" /> + <ngram occurrences="44" value="na" /> + <ngram occurrences="44" value="ie_" /> + <ngram occurrences="43" value="pr" /> + <ngram occurrences="42" value="sz" /> + <ngram occurrences="41" value="cz" /> + <ngram occurrences="40" value="po" /> + <ngram occurrences="39" value="u_" /> + <ngram occurrences="39" value="st" /> + <ngram occurrences="38" value="nie" /> + <ngram occurrences="38" value="m_" /> + <ngram occurrences="38" value="_t" /> + <ngram occurrences="37" value="wi" /> + <ngram occurrences="37" value="_po" /> + <ngram occurrences="35" value="za" /> + <ngram occurrences="35" value="w_" /> + <ngram occurrences="35" value="rz" /> + <ngram occurrences="35" value="an" /> + <ngram occurrences="34" value="ra" /> + <ngram occurrences="34" value="_pr" /> + <ngram occurrences="32" value="ow" /> + <ngram occurrences="32" value="j_" /> + <ngram occurrences="32" value="h" /> + <ngram occurrences="32" value="en" /> + <ngram occurrences="31" value="ej" /> + <ngram occurrences="31" value="_na" /> + <ngram occurrences="31" value="_k" /> + <ngram occurrences="31" value="_b" /> + <ngram occurrences="30" value="zy" /> + <ngram occurrences="30" value="ki" /> + <ngram occurrences="30" value="_j" /> + <ngram occurrences="29" value="ro" /> + <ngram occurrences="29" value="ej_" /> + <ngram occurrences="29" value="ch" /> + <ngram occurrences="28" value="ó" /> + <ngram occurrences="28" value="wa" /> + <ngram occurrences="28" value="eg" /> + <ngram occurrences="28" value="do" /> + <ngram occurrences="28" value="_ni" /> + <ngram occurrences="27" value="ne" /> + <ngram occurrences="27" value="_o" /> + <ngram occurrences="26" value="ta" /> + <ngram occurrences="26" value="ko" /> + <ngram occurrences="26" value="ia" /> + <ngram occurrences="26" value="_c" /> + <ngram occurrences="25" value="nie_" /> + <ngram occurrences="25" value="li" /> + <ngram occurrences="25" value="em" /> + <ngram occurrences="25" value="dz" /> + <ngram occurrences="25" value="_w_" /> + <ngram occurrences="25" value="_nie" /> + <ngram occurrences="24" value="ê_" /> + <ngram occurrences="24" value="to" /> + <ngram occurrences="24" value="_m" /> + <ngram occurrences="24" value="_i" /> + <ngram occurrences="23" value="go" /> + <ngram occurrences="21" value="z_" /> + <ngram occurrences="21" value="iê" /> + <ngram occurrences="21" value="ci" /> + <ngram occurrences="21" value="_za" /> + <ngram occurrences="21" value="_do" /> + <ngram occurrences="20" value="³_" /> + <ngram occurrences="20" value="te" /> + <ngram occurrences="20" value="or" /> + <ngram occurrences="20" value="le" /> + <ngram occurrences="20" value="by" /> + <ngram occurrences="20" value="al" /> + <ngram occurrences="20" value="_a" /> + <ngram occurrences="19" value="yc" /> + <ngram occurrences="19" value="wy" /> + <ngram occurrences="19" value="sk" /> + <ngram occurrences="19" value="re" /> + <ngram occurrences="19" value="ka" /> + <ngram occurrences="19" value="h_" /> + <ngram occurrences="19" value="go_" /> + <ngram occurrences="19" value="ego_" /> + <ngram occurrences="19" value="ego" /> + <ngram occurrences="19" value="cze" /> + <ngram occurrences="19" value="ch_" /> + <ngram occurrences="19" value="a³" /> + <ngram occurrences="19" value="aw" /> + <ngram occurrences="19" value="ani" /> + <ngram occurrences="19" value="_i_" /> + <ngram occurrences="19" value="_e" /> + <ngram occurrences="18" value="³o" /> + <ngram occurrences="18" value="zi" /> + <ngram occurrences="18" value="mi" /> + <ngram occurrences="18" value="je" /> + <ngram occurrences="18" value="ak" /> + <ngram occurrences="18" value="ac" /> + <ngram occurrences="18" value="_r" /> + <ngram occurrences="18" value="_g" /> + <ngram occurrences="17" value="ty" /> + <ngram occurrences="17" value="rze" /> + <ngram occurrences="17" value="em_" /> + <ngram occurrences="17" value="dzi" /> + <ngram occurrences="17" value="ar" /> + <ngram occurrences="17" value="_l" /> + <ngram occurrences="16" value="æ_" /> + <ngram occurrences="16" value="æ" /> + <ngram occurrences="16" value="zie" /> + <ngram occurrences="16" value="on" /> + <ngram occurrences="16" value="kie" /> + <ngram occurrences="16" value="k_" /> + <ngram occurrences="16" value="es" /> + <ngram occurrences="16" value="do_" /> + <ngram occurrences="16" value="a_p" /> + <ngram occurrences="16" value="_do_" /> + <ngram occurrences="15" value="ów" /> + <ngram occurrences="15" value="wie" /> + <ngram occurrences="15" value="prz" /> + <ngram occurrences="15" value="om" /> + <ngram occurrences="15" value="o_p" /> + <ngram occurrences="15" value="ny" /> + <ngram occurrences="15" value="na_" /> + <ngram occurrences="15" value="el" /> + <ngram occurrences="15" value="dzie" /> + <ngram occurrences="15" value="_prz" /> + <ngram occurrences="14" value="³a" /> + <ngram occurrences="14" value="ych" /> + <ngram occurrences="14" value="to_" /> + <ngram occurrences="14" value="ja" /> + <ngram occurrences="14" value="ic" /> + <ngram occurrences="14" value="er" /> + <ngram occurrences="14" value="eni" /> + <ngram occurrences="14" value="ec" /> + <ngram occurrences="14" value="am" /> + <ngram occurrences="14" value="_wi" /> + <ngram occurrences="14" value="_nie_" /> + <ngram occurrences="14" value="_je" /> + <ngram occurrences="13" value="ñ" /> + <ngram occurrences="13" value="zc" /> + <ngram occurrences="13" value="ym" /> + <ngram occurrences="13" value="ych_" /> + <ngram occurrences="13" value="ws" /> + <ngram occurrences="13" value="tr" /> + <ngram occurrences="13" value="pra" /> + <ngram occurrences="13" value="pi" /> + <ngram occurrences="13" value="pa" /> + <ngram occurrences="13" value="ol" /> + <ngram occurrences="13" value="od" /> + <ngram occurrences="13" value="ma" /> + <ngram occurrences="13" value="f" /> + <ngram occurrences="13" value="ez" /> + <ngram occurrences="13" value="ek" /> + <ngram occurrences="13" value="ed" /> + <ngram occurrences="13" value="dn" /> + <ngram occurrences="13" value="de" /> + <ngram occurrences="12" value="zn" /> + <ngram occurrences="12" value="ym_" /> + <ngram occurrences="12" value="szc" /> + <ngram occurrences="12" value="owa" /> + <ngram occurrences="12" value="ok" /> + <ngram occurrences="12" value="ob" /> + <ngram occurrences="12" value="nej_" /> + <ngram occurrences="12" value="nej" /> + <ngram occurrences="12" value="ce" /> + <ngram occurrences="12" value="as" /> + <ngram occurrences="12" value="_wy" /> + <ngram occurrences="12" value="_u" /> + <ngram occurrences="12" value="_e_" /> + <ngram occurrences="12" value="_by" /> + <ngram occurrences="11" value="zcz" /> + <ngram occurrences="11" value="ys" /> + <ngram occurrences="11" value="wo" /> + <ngram occurrences="11" value="we" /> + <ngram occurrences="11" value="wa_" /> + <ngram occurrences="11" value="szcz" /> + <ngram occurrences="11" value="prze" /> + <ngram occurrences="11" value="no" /> + <ngram occurrences="11" value="ni_" /> + <ngram occurrences="11" value="li_" /> + <ngram occurrences="11" value="ku" /> + <ngram occurrences="11" value="is" /> + <ngram occurrences="11" value="gr" /> + <ngram occurrences="11" value="dy" /> + <ngram occurrences="11" value="ad" /> + <ngram occurrences="11" value="_sz" /> + <ngram occurrences="11" value="_prze" /> + <ngram occurrences="11" value="_na_" /> + <ngram occurrences="10" value="³o_" /> + <ngram occurrences="10" value="ze_" /> + <ngram occurrences="10" value="ud" /> + <ngram occurrences="10" value="t_" /> + <ngram occurrences="10" value="ski" /> + <ngram occurrences="10" value="rzy" /> + <ngram occurrences="10" value="os" /> + <ngram occurrences="10" value="og" /> + <ngram occurrences="10" value="nt" /> + <ngram occurrences="10" value="nia" /> + <ngram occurrences="10" value="ln" /> + <ngram occurrences="10" value="iê_" /> + <ngram occurrences="10" value="iej" /> + <ngram occurrences="10" value="ia_" /> + <ngram occurrences="10" value="i_w" /> + <ngram occurrences="10" value="ent" /> + <ngram occurrences="10" value="e_p" /> + <ngram occurrences="10" value="e_b" /> + <ngram occurrences="10" value="cj" /> + <ngram occurrences="10" value="a³_" /> + <ngram occurrences="10" value="at" /> + <ngram occurrences="10" value="aj" /> + <ngram occurrences="10" value="_z_" /> + <ngram occurrences="10" value="_to_" /> + <ngram occurrences="10" value="_to" /> + <ngram occurrences="10" value="_ja" /> + <ngram occurrences="9" value="zy_" /> + <ngram occurrences="9" value="y³" /> + <ngram occurrences="9" value="us" /> + <ngram occurrences="9" value="tw" /> + <ngram occurrences="9" value="si" /> + <ngram occurrences="9" value="ru" /> + <ngram occurrences="9" value="ot" /> + <ngram occurrences="9" value="my" /> + <ngram occurrences="9" value="ki_" /> + <ngram occurrences="9" value="in" /> + <ngram occurrences="9" value="i_p" /> + <ngram occurrences="9" value="e_n" /> + <ngram occurrences="9" value="da" /> + <ngram occurrences="9" value="by³" /> + <ngram occurrences="9" value="by_" /> + <ngram occurrences="9" value="a_po" /> + <ngram occurrences="9" value="_ty" /> + <ngram occurrences="9" value="_pa" /> + <ngram occurrences="9" value="_ko" /> + <ngram occurrences="9" value="_cz" /> + <ngram occurrences="8" value="ów_" /> + <ngram occurrences="8" value="ñs" /> + <ngram occurrences="8" value="ê_p" /> + <ngram occurrences="8" value="³y" /> + <ngram occurrences="8" value="zcze" /> + <ngram occurrences="8" value="tó" /> + <ngram occurrences="8" value="szcze" /> + <ngram occurrences="8" value="raw" /> + <ngram occurrences="8" value="pre" /> + <ngram occurrences="8" value="praw" /> + <ngram occurrences="8" value="pan" /> + <ngram occurrences="8" value="o_w" /> + <ngram occurrences="8" value="no_" /> + <ngram occurrences="8" value="nia_" /> + <ngram occurrences="8" value="nego_" /> + <ngram occurrences="8" value="nego" /> + <ngram occurrences="8" value="neg" /> + <ngram occurrences="8" value="la" /> + <ngram occurrences="8" value="kt" /> + <ngram occurrences="8" value="iej_" /> + <ngram occurrences="8" value="ga" /> + <ngram occurrences="8" value="esz" /> + <ngram occurrences="8" value="dr" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="a_z" /> + <ngram occurrences="8" value="a_w" /> + <ngram occurrences="8" value="a_n" /> + <ngram occurrences="8" value="_te" /> + <ngram occurrences="8" value="_ta" /> + <ngram occurrences="8" value="_st" /> + <ngram occurrences="8" value="_si" /> + <ngram occurrences="8" value="_ro" /> + <ngram occurrences="8" value="_pra" /> + <ngram occurrences="8" value="_by³" /> + <ngram occurrences="7" value="êd" /> + <ngram occurrences="7" value="³u" /> + <ngram occurrences="7" value="za_" /> + <ngram occurrences="7" value="wsk" /> + <ngram occurrences="7" value="tu" /> + <ngram occurrences="7" value="tem" /> + <ngram occurrences="7" value="sze" /> + <ngram occurrences="7" value="str" /> + <ngram occurrences="7" value="sta" /> + <ngram occurrences="7" value="sp" /> + <ngram occurrences="7" value="skie" /> + <ngram occurrences="7" value="siê_" /> + <ngram occurrences="7" value="siê" /> + <ngram occurrences="7" value="s_" /> + <ngram occurrences="7" value="ry" /> + <ngram occurrences="7" value="rac" /> + <ngram occurrences="7" value="po_" /> + <ngram occurrences="7" value="oc" /> + <ngram occurrences="7" value="o_s" /> + <ngram occurrences="7" value="o_pr" /> + <ngram occurrences="7" value="ny_" /> + <ngram occurrences="7" value="naj" /> + <ngram occurrences="7" value="n_" /> + <ngram occurrences="7" value="my_" /> + <ngram occurrences="7" value="mie" /> + <ngram occurrences="7" value="lu" /> + <ngram occurrences="7" value="le_" /> + <ngram occurrences="7" value="ku_" /> + <ngram occurrences="7" value="ko_" /> + <ngram occurrences="7" value="ka_" /> + <ngram occurrences="7" value="jak" /> + <ngram occurrences="7" value="iu_" /> + <ngram occurrences="7" value="iu" /> + <ngram occurrences="7" value="iel" /> + <ngram occurrences="7" value="ieg" /> + <ngram occurrences="7" value="icz" /> + <ngram occurrences="7" value="i_n" /> + <ngram occurrences="7" value="gi" /> + <ngram occurrences="7" value="et" /> + <ngram occurrences="7" value="edn" /> + <ngram occurrences="7" value="e_s" /> + <ngram occurrences="7" value="e_d" /> + <ngram occurrences="7" value="dni" /> + <ngram occurrences="7" value="czy" /> + <ngram occurrences="7" value="cie" /> + <ngram occurrences="7" value="bi" /> + <ngram occurrences="7" value="be" /> + <ngram occurrences="7" value="añ" /> + <ngram occurrences="7" value="ak_" /> + <ngram occurrences="7" value="a_t" /> + <ngram occurrences="7" value="_wie" /> + <ngram occurrences="7" value="_siê_" /> + <ngram occurrences="7" value="_siê" /> + <ngram occurrences="7" value="_pre" /> + <ngram occurrences="7" value="_po_" /> + <ngram occurrences="7" value="_kt" /> + <ngram occurrences="7" value="_jak" /> + <ngram occurrences="7" value="_gr" /> + <ngram occurrences="7" value="_a_" /> + <ngram occurrences="6" value="ór" /> + <ngram occurrences="6" value="êdz" /> + <ngram occurrences="6" value="êc" /> + <ngram occurrences="6" value="zu" /> + <ngram occurrences="6" value="zen" /> + <ngram occurrences="6" value="yt" /> + <ngram occurrences="6" value="yd" /> + <ngram occurrences="6" value="yb" /> + <ngram occurrences="6" value="y_p" /> + <ngram occurrences="6" value="wski" /> + <ngram occurrences="6" value="wi_" /> + <ngram occurrences="6" value="wan" /> + <ngram occurrences="6" value="usz" /> + <ngram occurrences="6" value="un" /> + <ngram occurrences="6" value="uk" /> + <ngram occurrences="6" value="u_n" /> + <ngram occurrences="6" value="tór" /> + <ngram occurrences="6" value="ta_" /> + <ngram occurrences="6" value="s³" /> + <ngram occurrences="6" value="sy" /> + <ngram occurrences="6" value="stw" /> + <ngram occurrences="6" value="pom" /> + <ngram occurrences="6" value="oz" /> + <ngram occurrences="6" value="ows" /> + <ngram occurrences="6" value="owi" /> + <ngram occurrences="6" value="o_z" /> + <ngram occurrences="6" value="o_po" /> + <ngram occurrences="6" value="o_m" /> + <ngram occurrences="6" value="o_k" /> + <ngram occurrences="6" value="o_i" /> + <ngram occurrences="6" value="o_d" /> + <ngram occurrences="6" value="niu_" /> + <ngram occurrences="6" value="niu" /> + <ngram occurrences="6" value="nic" /> + <ngram occurrences="6" value="nd" /> + <ngram occurrences="6" value="mó" /> + <ngram occurrences="6" value="mo" /> + <ngram occurrences="6" value="m_w" /> + <ngram occurrences="6" value="lne" /> + <ngram occurrences="6" value="któr" /> + <ngram occurrences="6" value="któ" /> + <ngram occurrences="6" value="kr" /> + <ngram occurrences="6" value="ju" /> + <ngram occurrences="6" value="ji_" /> +</ngrams> diff --git a/src/plugins/language/portuguese.klp b/src/plugins/language/portuguese.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="752" value="_" /> + <ngram occurrences="454" value="a" /> + <ngram occurrences="426" value="o" /> + <ngram occurrences="419" value="e" /> + <ngram occurrences="308" value="s" /> + <ngram occurrences="270" value="i" /> + <ngram occurrences="267" value="r" /> + <ngram occurrences="209" value="t" /> + <ngram occurrences="201" value="d" /> + <ngram occurrences="198" value="n" /> + <ngram occurrences="189" value="o_" /> + <ngram occurrences="169" value="m" /> + <ngram occurrences="146" value="u" /> + <ngram occurrences="141" value="a_" /> + <ngram occurrences="138" value="c" /> + <ngram occurrences="136" value="e_" /> + <ngram occurrences="131" value="s_" /> + <ngram occurrences="106" value="p" /> + <ngram occurrences="104" value="_d" /> + <ngram occurrences="97" value="l" /> + <ngram occurrences="79" value="de" /> + <ngram occurrences="78" value="_a" /> + <ngram occurrences="68" value="es" /> + <ngram occurrences="67" value="os" /> + <ngram occurrences="66" value="_p" /> + <ngram occurrences="61" value="ra" /> + <ngram occurrences="61" value="os_" /> + <ngram occurrences="61" value="do" /> + <ngram occurrences="61" value="_s" /> + <ngram occurrences="59" value="nt" /> + <ngram occurrences="59" value="_de" /> + <ngram occurrences="54" value="de_" /> + <ngram occurrences="53" value="v" /> + <ngram occurrences="52" value="_c" /> + <ngram occurrences="49" value="re" /> + <ngram occurrences="49" value="_m" /> + <ngram occurrences="48" value="to" /> + <ngram occurrences="48" value="_e" /> + <ngram occurrences="47" value="te" /> + <ngram occurrences="46" value="r_" /> + <ngram occurrences="46" value="g" /> + <ngram occurrences="46" value="ar" /> + <ngram occurrences="45" value="ta" /> + <ngram occurrences="45" value="or" /> + <ngram occurrences="45" value="co" /> + <ngram occurrences="45" value="_n" /> + <ngram occurrences="44" value="en" /> + <ngram occurrences="43" value="se" /> + <ngram occurrences="43" value="do_" /> + <ngram occurrences="42" value="_de_" /> + <ngram occurrences="41" value="f" /> + <ngram occurrences="41" value="er" /> + <ngram occurrences="40" value="m_" /> + <ngram occurrences="39" value="ma" /> + <ngram occurrences="39" value="as" /> + <ngram occurrences="39" value="_t" /> + <ngram occurrences="38" value="ri" /> + <ngram occurrences="38" value="b" /> + <ngram occurrences="37" value="o_d" /> + <ngram occurrences="37" value="da" /> + <ngram occurrences="37" value="ad" /> + <ngram occurrences="34" value="st" /> + <ngram occurrences="34" value="qu" /> + <ngram occurrences="34" value="q" /> + <ngram occurrences="33" value="no" /> + <ngram occurrences="33" value="_se" /> + <ngram occurrences="33" value="_o" /> + <ngram occurrences="33" value="_co" /> + <ngram occurrences="32" value="ç" /> + <ngram occurrences="32" value="ão" /> + <ngram occurrences="32" value="ã" /> + <ngram occurrences="32" value="is" /> + <ngram occurrences="31" value="ão_" /> + <ngram occurrences="30" value="in" /> + <ngram occurrences="30" value="ia" /> + <ngram occurrences="30" value="an" /> + <ngram occurrences="29" value="me" /> + <ngram occurrences="29" value="es_" /> + <ngram occurrences="28" value="ue" /> + <ngram occurrences="28" value="pa" /> + <ngram occurrences="28" value="_qu" /> + <ngram occurrences="28" value="_q" /> + <ngram occurrences="28" value="_f" /> + <ngram occurrences="27" value="ti" /> + <ngram occurrences="27" value="po" /> + <ngram occurrences="27" value="on" /> + <ngram occurrences="27" value="io" /> + <ngram occurrences="27" value="h" /> + <ngram occurrences="27" value="al" /> + <ngram occurrences="26" value="s_d" /> + <ngram occurrences="26" value="que" /> + <ngram occurrences="26" value="nte" /> + <ngram occurrences="26" value="am" /> + <ngram occurrences="25" value="ent" /> + <ngram occurrences="25" value="ca" /> + <ngram occurrences="25" value="_do" /> + <ngram occurrences="24" value="om" /> + <ngram occurrences="24" value="_que" /> + <ngram occurrences="24" value="_a_" /> + <ngram occurrences="23" value="to_" /> + <ngram occurrences="23" value="em" /> + <ngram occurrences="23" value="ci" /> + <ngram occurrences="23" value="as_" /> + <ngram occurrences="22" value="ra_" /> + <ngram occurrences="21" value="é" /> + <ngram occurrences="21" value="ue_" /> + <ngram occurrences="21" value="u_" /> + <ngram occurrences="21" value="te_" /> + <ngram occurrences="21" value="que_" /> + <ngram occurrences="21" value="_r" /> + <ngram occurrences="21" value="_que_" /> + <ngram occurrences="21" value="_pa" /> + <ngram occurrences="21" value="_no" /> + <ngram occurrences="20" value="o_de" /> + <ngram occurrences="20" value="na" /> + <ngram occurrences="20" value="ec" /> + <ngram occurrences="20" value="_po" /> + <ngram occurrences="19" value="tr" /> + <ngram occurrences="19" value="ic" /> + <ngram occurrences="19" value="em_" /> + <ngram occurrences="19" value="ei" /> + <ngram occurrences="18" value="á" /> + <ngram occurrences="18" value="ss" /> + <ngram occurrences="18" value="si" /> + <ngram occurrences="18" value="ou" /> + <ngram occurrences="18" value="no_" /> + <ngram occurrences="18" value="li" /> + <ngram occurrences="18" value="ce" /> + <ngram occurrences="18" value="aç" /> + <ngram occurrences="18" value="ado" /> + <ngram occurrences="18" value="a_d" /> + <ngram occurrences="18" value="_re" /> + <ngram occurrences="18" value="_i" /> + <ngram occurrences="18" value="_e_" /> + <ngram occurrences="17" value="par" /> + <ngram occurrences="17" value="o_c" /> + <ngram occurrences="17" value="o_a" /> + <ngram occurrences="17" value="nto" /> + <ngram occurrences="17" value="nd" /> + <ngram occurrences="17" value="mi" /> + <ngram occurrences="17" value="id" /> + <ngram occurrences="17" value="_o_" /> + <ngram occurrences="17" value="_do_" /> + <ngram occurrences="17" value="_da" /> + <ngram occurrences="16" value="um" /> + <ngram occurrences="16" value="so" /> + <ngram occurrences="16" value="sa" /> + <ngram occurrences="16" value="res" /> + <ngram occurrences="16" value="pr" /> + <ngram occurrences="16" value="o_p" /> + <ngram occurrences="16" value="men" /> + <ngram occurrences="16" value="l_" /> + <ngram occurrences="16" value="im" /> + <ngram occurrences="16" value="da_" /> + <ngram occurrences="16" value="ai" /> + <ngram occurrences="15" value="í" /> + <ngram occurrences="15" value="ve" /> + <ngram occurrences="15" value="rt" /> + <ngram occurrences="15" value="mo" /> + <ngram occurrences="15" value="it" /> + <ngram occurrences="15" value="il" /> + <ngram occurrences="15" value="el" /> + <ngram occurrences="15" value="ant" /> + <ngram occurrences="15" value="a_a" /> + <ngram occurrences="15" value="_par" /> + <ngram occurrences="15" value="_ma" /> + <ngram occurrences="14" value="ção_" /> + <ngram occurrences="14" value="ção" /> + <ngram occurrences="14" value="çã" /> + <ngram occurrences="14" value="s_de" /> + <ngram occurrences="14" value="ro" /> + <ngram occurrences="14" value="o_s" /> + <ngram occurrences="14" value="o_de_" /> + <ngram occurrences="14" value="ma_" /> + <ngram occurrences="14" value="ia_" /> + <ngram occurrences="14" value="fo" /> + <ngram occurrences="14" value="est" /> + <ngram occurrences="14" value="er_" /> + <ngram occurrences="14" value="e_p" /> + <ngram occurrences="14" value="con" /> + <ngram occurrences="14" value="com" /> + <ngram occurrences="14" value="ara" /> + <ngram occurrences="14" value="a_p" /> + <ngram occurrences="14" value="_l" /> + <ngram occurrences="14" value="_b" /> + <ngram occurrences="13" value="ão_d" /> + <ngram occurrences="13" value="or_" /> + <ngram occurrences="13" value="ont" /> + <ngram occurrences="13" value="nte_" /> + <ngram occurrences="13" value="ment" /> + <ngram occurrences="13" value="la" /> + <ngram occurrences="13" value="ir" /> + <ngram occurrences="13" value="dos_" /> + <ngram occurrences="13" value="dos" /> + <ngram occurrences="13" value="ar_" /> + <ngram occurrences="13" value="ac" /> + <ngram occurrences="13" value="a_de" /> + <ngram occurrences="13" value="_com" /> + <ngram occurrences="12" value="x" /> + <ngram occurrences="12" value="va" /> + <ngram occurrences="12" value="uma_" /> + <ngram occurrences="12" value="uma" /> + <ngram occurrences="12" value="tu" /> + <ngram occurrences="12" value="sta" /> + <ngram occurrences="12" value="s_p" /> + <ngram occurrences="12" value="s_e" /> + <ngram occurrences="12" value="pe" /> + <ngram occurrences="12" value="ou_" /> + <ngram occurrences="12" value="os_d" /> + <ngram occurrences="12" value="nto_" /> + <ngram occurrences="12" value="lh" /> + <ngram occurrences="12" value="ho" /> + <ngram occurrences="12" value="e_d" /> + <ngram occurrences="12" value="e_a" /> + <ngram occurrences="12" value="di" /> + <ngram occurrences="12" value="a_m" /> + <ngram occurrences="12" value="_v" /> + <ngram occurrences="12" value="_no_" /> + <ngram occurrences="12" value="_fo" /> + <ngram occurrences="12" value="_es" /> + <ngram occurrences="11" value="vo" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="tra" /> + <ngram occurrences="11" value="tos_" /> + <ngram occurrences="11" value="tos" /> + <ngram occurrences="11" value="s_a" /> + <ngram occurrences="11" value="rio" /> + <ngram occurrences="11" value="o_m" /> + <ngram occurrences="11" value="o_e" /> + <ngram occurrences="11" value="ni" /> + <ngram occurrences="11" value="is_" /> + <ngram occurrences="11" value="gu" /> + <ngram occurrences="11" value="ente" /> + <ngram occurrences="11" value="e_n" /> + <ngram occurrences="11" value="e_c" /> + <ngram occurrences="11" value="at" /> + <ngram occurrences="11" value="am_" /> + <ngram occurrences="11" value="ado_" /> + <ngram occurrences="11" value="a_s" /> + <ngram occurrences="11" value="_um" /> + <ngram occurrences="11" value="_u" /> + <ngram occurrences="11" value="_pr" /> + <ngram occurrences="11" value="_na" /> + <ngram occurrences="10" value="ção_d" /> + <ngram occurrences="10" value="ur" /> + <ngram occurrences="10" value="ua" /> + <ngram occurrences="10" value="s_t" /> + <ngram occurrences="10" value="s_n" /> + <ngram occurrences="10" value="s_de_" /> + <ngram occurrences="10" value="ria" /> + <ngram occurrences="10" value="r_a" /> + <ngram occurrences="10" value="ol" /> + <ngram occurrences="10" value="o_do" /> + <ngram occurrences="10" value="o_co" /> + <ngram occurrences="10" value="ne" /> + <ngram occurrences="10" value="nc" /> + <ngram occurrences="10" value="mu" /> + <ngram occurrences="10" value="lo" /> + <ngram occurrences="10" value="ist" /> + <ngram occurrences="10" value="io_" /> + <ngram occurrences="10" value="ica" /> + <ngram occurrences="10" value="gr" /> + <ngram occurrences="10" value="e_t" /> + <ngram occurrences="10" value="e_m" /> + <ngram occurrences="10" value="des" /> + <ngram occurrences="10" value="dad" /> + <ngram occurrences="10" value="ação_" /> + <ngram occurrences="10" value="ação" /> + <ngram occurrences="10" value="açã" /> + <ngram occurrences="10" value="ara_" /> + <ngram occurrences="10" value="al_" /> + <ngram occurrences="10" value="ade" /> + <ngram occurrences="10" value="_uma_" /> + <ngram occurrences="10" value="_uma" /> + <ngram occurrences="10" value="_in" /> + <ngram occurrences="10" value="_con" /> + <ngram occurrences="9" value="ões_" /> + <ngram occurrences="9" value="ões" /> + <ngram occurrences="9" value="õe" /> + <ngram occurrences="9" value="õ" /> + <ngram occurrences="9" value="ça" /> + <ngram occurrences="9" value="ul" /> + <ngram occurrences="9" value="ui" /> + <ngram occurrences="9" value="ter" /> + <ngram occurrences="9" value="ta_" /> + <ngram occurrences="9" value="ser" /> + <ngram occurrences="9" value="sen" /> + <ngram occurrences="9" value="rec" /> + <ngram occurrences="9" value="por" /> + <ngram occurrences="9" value="para_" /> + <ngram occurrences="9" value="para" /> + <ngram occurrences="9" value="o_n" /> + <ngram occurrences="9" value="mp" /> + <ngram occurrences="9" value="le" /> + <ngram occurrences="9" value="j" /> + <ngram occurrences="9" value="iv" /> + <ngram occurrences="9" value="ida" /> + <ngram occurrences="9" value="ente_" /> + <ngram occurrences="9" value="eg" /> + <ngram occurrences="9" value="do_p" /> + <ngram occurrences="9" value="ct" /> + <ngram occurrences="9" value="cont" /> + <ngram occurrences="9" value="br" /> + <ngram occurrences="9" value="ap" /> + <ngram occurrences="9" value="a_e" /> + <ngram occurrences="9" value="a_de_" /> + <ngram occurrences="9" value="_te" /> + <ngram occurrences="9" value="_ta" /> + <ngram occurrences="9" value="_por" /> + <ngram occurrences="9" value="_para" /> + <ngram occurrences="9" value="_mi" /> + <ngram occurrences="9" value="_me" /> + <ngram occurrences="9" value="_ap" /> + <ngram occurrences="8" value="z" /> + <ngram occurrences="8" value="tiv" /> + <ngram occurrences="8" value="tes" /> + <ngram occurrences="8" value="tado" /> + <ngram occurrences="8" value="tad" /> + <ngram occurrences="8" value="s_o" /> + <ngram occurrences="8" value="rr" /> + <ngram occurrences="8" value="ov" /> + <ngram occurrences="8" value="oc" /> + <ngram occurrences="8" value="o_t" /> + <ngram occurrences="8" value="o_se" /> + <ngram occurrences="8" value="o_o" /> + <ngram occurrences="8" value="nta" /> + <ngram occurrences="8" value="ns" /> + <ngram occurrences="8" value="mo_" /> + <ngram occurrences="8" value="m_a" /> + <ngram occurrences="8" value="ime" /> + <ngram occurrences="8" value="gra" /> + <ngram occurrences="8" value="gi" /> + <ngram occurrences="8" value="fi" /> + <ngram occurrences="8" value="ess" /> + <ngram occurrences="8" value="ed" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="ba" /> + <ngram occurrences="8" value="ab" /> + <ngram occurrences="8" value="a_c" /> + <ngram occurrences="8" value="_ser" /> + <ngram occurrences="8" value="_pe" /> + <ngram occurrences="8" value="_os_" /> + <ngram occurrences="8" value="_os" /> + <ngram occurrences="8" value="_mu" /> + <ngram occurrences="8" value="_est" /> + <ngram occurrences="8" value="_em" /> + <ngram occurrences="8" value="_des" /> + <ngram occurrences="8" value="_da_" /> + <ngram occurrences="7" value="ça_" /> + <ngram occurrences="7" value="ão_de" /> + <ngram occurrences="7" value="à" /> + <ngram occurrences="7" value="va_" /> + <ngram occurrences="7" value="ut" /> + <ngram occurrences="7" value="un" /> + <ngram occurrences="7" value="tes_" /> + <ngram occurrences="7" value="tar" /> + <ngram occurrences="7" value="tan" /> + <ngram occurrences="7" value="str" /> + <ngram occurrences="7" value="ser_" /> + <ngram occurrences="7" value="se_" /> + <ngram occurrences="7" value="s_c" /> + <ngram occurrences="7" value="ria_" /> + <ngram occurrences="7" value="res_" /> + <ngram occurrences="7" value="r_m" /> + <ngram occurrences="7" value="os_p" /> + <ngram occurrences="7" value="ort" /> + <ngram occurrences="7" value="omo_" /> + <ngram occurrences="7" value="omo" /> + <ngram occurrences="7" value="o_que" /> + <ngram occurrences="7" value="o_qu" /> + <ngram occurrences="7" value="o_q" /> + <ngram occurrences="7" value="o_i" /> + <ngram occurrences="7" value="nos" /> + <ngram occurrences="7" value="ndo_" /> + <ngram occurrences="7" value="ndo" /> + <ngram occurrences="7" value="min" /> + <ngram occurrences="7" value="mento" /> + <ngram occurrences="7" value="ito" /> + <ngram occurrences="7" value="idad" /> + <ngram occurrences="7" value="i_" /> + <ngram occurrences="7" value="go" /> + <ngram occurrences="7" value="eu" /> + <ngram occurrences="7" value="esta" /> + <ngram occurrences="7" value="ento" /> + <ngram occurrences="7" value="ece" /> + <ngram occurrences="7" value="e_o" /> + <ngram occurrences="7" value="e_de" /> + <ngram occurrences="7" value="das_" /> + <ngram occurrences="7" value="das" /> + <ngram occurrences="7" value="dade" /> + <ngram occurrences="7" value="como_" /> + <ngram occurrences="7" value="como" /> + <ngram occurrences="7" value="cia" /> + <ngram occurrences="7" value="av" /> + <ngram occurrences="7" value="a_r" /> + <ngram occurrences="7" value="a_f" /> + <ngram occurrences="7" value="_à" /> + <ngram occurrences="7" value="_ne" /> + <ngram occurrences="7" value="_g" /> + <ngram occurrences="7" value="_em_" /> +</ngrams> diff --git a/src/plugins/language/quechua.klp b/src/plugins/language/quechua.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="861" value="a" /> + <ngram occurrences="535" value="_" /> + <ngram occurrences="329" value="n" /> + <ngram occurrences="273" value="i" /> + <ngram occurrences="260" value="u" /> + <ngram occurrences="200" value="a_" /> + <ngram occurrences="196" value="h" /> + <ngram occurrences="193" value="s" /> + <ngram occurrences="190" value="t" /> + <ngram occurrences="174" value="k" /> + <ngram occurrences="171" value="y" /> + <ngram occurrences="171" value="q" /> + <ngram occurrences="163" value="c" /> + <ngram occurrences="160" value="m" /> + <ngram occurrences="159" value="p" /> + <ngram occurrences="147" value="ch" /> + <ngram occurrences="142" value="r" /> + <ngram occurrences="131" value="an" /> + <ngram occurrences="119" value="ta" /> + <ngram occurrences="107" value="qa" /> + <ngram occurrences="106" value="ay" /> + <ngram occurrences="104" value="ma" /> + <ngram occurrences="102" value="e" /> + <ngram occurrences="96" value="ha" /> + <ngram occurrences="93" value="j" /> + <ngram occurrences="91" value="pa" /> + <ngram occurrences="91" value="l" /> + <ngram occurrences="82" value="ku" /> + <ngram occurrences="77" value="na" /> + <ngram occurrences="77" value="cha" /> + <ngram occurrences="73" value="o" /> + <ngram occurrences="68" value="n_" /> + <ngram occurrences="66" value="in" /> + <ngram occurrences="62" value="un" /> + <ngram occurrences="61" value="qa_" /> + <ngram occurrences="61" value="as" /> + <ngram occurrences="59" value="ar" /> + <ngram occurrences="54" value="ta_" /> + <ngram occurrences="54" value="man" /> + <ngram occurrences="50" value="_m" /> + <ngram occurrences="50" value="_k" /> + <ngram occurrences="48" value="i_" /> + <ngram occurrences="46" value="am" /> + <ngram occurrences="46" value="ac" /> + <ngram occurrences="45" value="w" /> + <ngram occurrences="44" value="_c" /> + <ngram occurrences="43" value="ri" /> + <ngram occurrences="42" value="nt" /> + <ngram occurrences="41" value="at" /> + <ngram occurrences="41" value="_p" /> + <ngram occurrences="41" value="_ch" /> + <ngram occurrences="41" value="_a" /> + <ngram occurrences="40" value="ka" /> + <ngram occurrences="39" value="y_" /> + <ngram occurrences="39" value="wa" /> + <ngram occurrences="37" value="pi" /> + <ngram occurrences="37" value="ach" /> + <ngram occurrences="37" value="_ma" /> + <ngram occurrences="36" value="sq" /> + <ngram occurrences="36" value="nc" /> + <ngram occurrences="36" value="hu" /> + <ngram occurrences="35" value="sqa" /> + <ngram occurrences="35" value="rq" /> + <ngram occurrences="35" value="an_" /> + <ngram occurrences="35" value="aj" /> + <ngram occurrences="34" value="uy" /> + <ngram occurrences="34" value="rqa" /> + <ngram occurrences="34" value="nch" /> + <ngram occurrences="34" value="aq" /> + <ngram occurrences="34" value="_s" /> + <ngram occurrences="34" value="_j" /> + <ngram occurrences="33" value="una" /> + <ngram occurrences="33" value="ll" /> + <ngram occurrences="32" value="sp" /> + <ngram occurrences="32" value="_ka" /> + <ngram occurrences="31" value="nta" /> + <ngram occurrences="31" value="hay" /> + <ngram occurrences="31" value="chay" /> + <ngram occurrences="31" value="ata" /> + <ngram occurrences="30" value="us" /> + <ngram occurrences="30" value="u_" /> + <ngram occurrences="30" value="pa_" /> + <ngram occurrences="30" value="j_" /> + <ngram occurrences="30" value="is" /> + <ngram occurrences="29" value="ay_" /> + <ngram occurrences="28" value="ya" /> + <ngram occurrences="28" value="ni" /> + <ngram occurrences="28" value="ama" /> + <ngram occurrences="28" value="_cha" /> + <ngram occurrences="27" value="spa" /> + <ngram occurrences="27" value="s_" /> + <ngram occurrences="27" value="kun" /> + <ngram occurrences="27" value="hi" /> + <ngram occurrences="27" value="_chay" /> + <ngram occurrences="26" value="na_" /> + <ngram occurrences="26" value="la" /> + <ngram occurrences="26" value="_t" /> + <ngram occurrences="25" value="ant" /> + <ngram occurrences="25" value="aj_" /> + <ngram occurrences="24" value="ti" /> + <ngram occurrences="24" value="rqa_" /> + <ngram occurrences="24" value="q_" /> + <ngram occurrences="24" value="pi_" /> + <ngram occurrences="24" value="chu" /> + <ngram occurrences="24" value="_q" /> + <ngram occurrences="23" value="yk" /> + <ngram occurrences="23" value="nk" /> + <ngram occurrences="23" value="lla" /> + <ngram occurrences="23" value="kuna" /> + <ngram occurrences="23" value="ik" /> + <ngram occurrences="23" value="ak" /> + <ngram occurrences="23" value="_r" /> + <ngram occurrences="23" value="_i" /> + <ngram occurrences="22" value="su" /> + <ngram occurrences="22" value="spa_" /> + <ngram occurrences="22" value="he" /> + <ngram occurrences="22" value="ari" /> + <ngram occurrences="22" value="acha" /> + <ngram occurrences="22" value="_n" /> + <ngram occurrences="21" value="chi" /> + <ngram occurrences="21" value="a_m" /> + <ngram occurrences="21" value="a_c" /> + <ngram occurrences="21" value="_pa" /> + <ngram occurrences="20" value="ñ" /> + <ngram occurrences="20" value="uk" /> + <ngram occurrences="20" value="tu" /> + <ngram occurrences="20" value="taj" /> + <ngram occurrences="20" value="sqa_" /> + <ngram occurrences="20" value="ra" /> + <ngram occurrences="20" value="qan" /> + <ngram occurrences="20" value="man_" /> + <ngram occurrences="20" value="in_" /> + <ngram occurrences="20" value="im" /> + <ngram occurrences="20" value="ayk" /> + <ngram occurrences="20" value="ap" /> + <ngram occurrences="20" value="anta" /> + <ngram occurrences="20" value="anch" /> + <ngram occurrences="20" value="anc" /> + <ngram occurrences="20" value="al" /> + <ngram occurrences="20" value="a_ch" /> + <ngram occurrences="19" value="yt" /> + <ngram occurrences="19" value="nta_" /> + <ngram occurrences="19" value="ki" /> + <ngram occurrences="19" value="aw" /> + <ngram occurrences="19" value="aq_" /> + <ngram occurrences="19" value="ana" /> + <ngram occurrences="19" value="a_k" /> + <ngram occurrences="19" value="_u" /> + <ngram occurrences="18" value="yta" /> + <ngram occurrences="18" value="st" /> + <ngram occurrences="18" value="nin" /> + <ngram occurrences="18" value="awa" /> + <ngram occurrences="18" value="asqa" /> + <ngram occurrences="18" value="asq" /> + <ngram occurrences="17" value="si" /> + <ngram occurrences="17" value="kuy" /> + <ngram occurrences="17" value="iku" /> + <ngram occurrences="17" value="che" /> + <ngram occurrences="17" value="arq" /> + <ngram occurrences="17" value="a_ma" /> + <ngram occurrences="17" value="_w" /> + <ngram occurrences="17" value="_man" /> + <ngram occurrences="16" value="ña" /> + <ngram occurrences="16" value="yn" /> + <ngram occurrences="16" value="taj_" /> + <ngram occurrences="16" value="os" /> + <ngram occurrences="16" value="ncha" /> + <ngram occurrences="16" value="d" /> + <ngram occurrences="16" value="arqa" /> + <ngram occurrences="16" value="a_p" /> + <ngram occurrences="15" value="up" /> + <ngram occurrences="15" value="ru" /> + <ngram occurrences="15" value="k_" /> + <ngram occurrences="15" value="ank" /> + <ngram occurrences="15" value="_l" /> + <ngram occurrences="14" value="yku" /> + <ngram occurrences="14" value="rik" /> + <ngram occurrences="14" value="pay" /> + <ngram occurrences="14" value="nku" /> + <ngram occurrences="14" value="mp" /> + <ngram occurrences="14" value="manta" /> + <ngram occurrences="14" value="mant" /> + <ngram occurrences="14" value="ima" /> + <ngram occurrences="14" value="es" /> + <ngram occurrences="14" value="ej" /> + <ngram occurrences="14" value="ayku" /> + <ngram occurrences="14" value="aman" /> + <ngram occurrences="14" value="a_cha" /> + <ngram occurrences="14" value="_y" /> + <ngram occurrences="14" value="_h" /> + <ngram occurrences="13" value="ur" /> + <ngram occurrences="13" value="taq" /> + <ngram occurrences="13" value="pu" /> + <ngram occurrences="13" value="mu" /> + <ngram occurrences="13" value="mi" /> + <ngram occurrences="13" value="ku_" /> + <ngram occurrences="13" value="ina" /> + <ngram occurrences="13" value="ha_" /> + <ngram occurrences="13" value="g" /> + <ngram occurrences="13" value="er" /> + <ngram occurrences="13" value="en" /> + <ngram occurrences="13" value="ayt" /> + <ngram occurrences="13" value="anta_" /> + <ngram occurrences="13" value="all" /> + <ngram occurrences="13" value="a_s" /> + <ngram occurrences="13" value="a_j" /> + <ngram occurrences="13" value="a_a" /> + <ngram occurrences="13" value="_wa" /> + <ngram occurrences="13" value="_su" /> + <ngram occurrences="12" value="í" /> + <ngram occurrences="12" value="yta_" /> + <ngram occurrences="12" value="um" /> + <ngram occurrences="12" value="uch" /> + <ngram occurrences="12" value="uc" /> + <ngram occurrences="12" value="tin" /> + <ngram occurrences="12" value="taq_" /> + <ngram occurrences="12" value="nq" /> + <ngram occurrences="12" value="nan" /> + <ngram occurrences="12" value="mana" /> + <ngram occurrences="12" value="li" /> + <ngram occurrences="12" value="ju" /> + <ngram occurrences="12" value="it" /> + <ngram occurrences="12" value="erqa" /> + <ngram occurrences="12" value="erq" /> + <ngram occurrences="12" value="cha_" /> + <ngram occurrences="12" value="ayta" /> + <ngram occurrences="12" value="ancha" /> + <ngram occurrences="12" value="aku" /> + <ngram occurrences="12" value="a_ka" /> + <ngram occurrences="12" value="_pay" /> + <ngram occurrences="12" value="_ju" /> + <ngram occurrences="11" value="ut" /> + <ngram occurrences="11" value="una_" /> + <ngram occurrences="11" value="sa" /> + <ngram occurrences="11" value="ray" /> + <ngram occurrences="11" value="kay" /> + <ngram occurrences="11" value="iy" /> + <ngram occurrences="11" value="hay_" /> + <ngram occurrences="11" value="erqa_" /> + <ngram occurrences="11" value="chay_" /> + <ngram occurrences="11" value="a_man" /> + <ngram occurrences="11" value="_tu" /> + <ngram occurrences="11" value="_pu" /> + <ngram occurrences="11" value="_mana" /> + <ngram occurrences="11" value="_ll" /> + <ngram occurrences="11" value="_e" /> + <ngram occurrences="10" value="yp" /> + <ngram occurrences="10" value="yni" /> + <ngram occurrences="10" value="uma" /> + <ngram occurrences="10" value="sta" /> + <ngram occurrences="10" value="riku" /> + <ngram occurrences="10" value="re" /> + <ngram occurrences="10" value="qh" /> + <ngram occurrences="10" value="qa_k" /> + <ngram occurrences="10" value="may" /> + <ngram occurrences="10" value="kh" /> + <ngram occurrences="10" value="je" /> + <ngram occurrences="10" value="io" /> + <ngram occurrences="10" value="ia" /> + <ngram occurrences="10" value="hu_" /> + <ngram occurrences="10" value="hej" /> + <ngram occurrences="10" value="har" /> + <ngram occurrences="10" value="chu_" /> + <ngram occurrences="10" value="chej" /> + <ngram occurrences="10" value="ata_" /> + <ngram occurrences="10" value="asqa_" /> + <ngram occurrences="10" value="asp" /> + <ngram occurrences="10" value="a_q" /> + <ngram occurrences="10" value="_ñ" /> + <ngram occurrences="10" value="_ya" /> + <ngram occurrences="10" value="_sa" /> + <ngram occurrences="10" value="_ni" /> + <ngram occurrences="10" value="_ku" /> + <ngram occurrences="9" value="ypi" /> + <ngram occurrences="9" value="ynin" /> + <ngram occurrences="9" value="uya" /> + <ngram occurrences="9" value="usqa" /> + <ngram occurrences="9" value="usq" /> + <ngram occurrences="9" value="sqa_k" /> + <ngram occurrences="9" value="run" /> + <ngram occurrences="9" value="rqan" /> + <ngram occurrences="9" value="qo" /> + <ngram occurrences="9" value="qha" /> + <ngram occurrences="9" value="qay" /> + <ngram occurrences="9" value="nqa" /> + <ngram occurrences="9" value="ne" /> + <ngram occurrences="9" value="nchej" /> + <ngram occurrences="9" value="nche" /> + <ngram occurrences="9" value="mana_" /> + <ngram occurrences="9" value="mach" /> + <ngram occurrences="9" value="mac" /> + <ngram occurrences="9" value="kuna_" /> + <ngram occurrences="9" value="ki_" /> + <ngram occurrences="9" value="khu" /> + <ngram occurrences="9" value="kay_" /> + <ngram occurrences="9" value="k_a" /> + <ngram occurrences="9" value="jes" /> + <ngram occurrences="9" value="ita" /> + <ngram occurrences="9" value="ir" /> + <ngram occurrences="9" value="inc" /> + <ngram occurrences="9" value="dio" /> + <ngram occurrences="9" value="di" /> + <ngram occurrences="9" value="ayp" /> + <ngram occurrences="9" value="ayn" /> + <ngram occurrences="9" value="aspa" /> + <ngram occurrences="9" value="arqa_" /> + <ngram occurrences="9" value="anku" /> + <ngram occurrences="9" value="ana_" /> + <ngram occurrences="9" value="aman_" /> + <ngram occurrences="9" value="a_t" /> + <ngram occurrences="9" value="a_r" /> + <ngram occurrences="9" value="_ña" /> + <ngram occurrences="9" value="_qh" /> + <ngram occurrences="9" value="_jes" /> + <ngram occurrences="9" value="_je" /> + <ngram occurrences="9" value="_ima" /> + <ngram occurrences="9" value="_im" /> + <ngram occurrences="8" value="yq" /> + <ngram occurrences="8" value="yki" /> + <ngram occurrences="8" value="wan" /> + <ngram occurrences="8" value="upa" /> + <ngram occurrences="8" value="un_" /> + <ngram occurrences="8" value="ukuy" /> + <ngram occurrences="8" value="uku" /> + <ngram occurrences="8" value="tukuy" /> + <ngram occurrences="8" value="tuku" /> + <ngram occurrences="8" value="tuk" /> + <ngram occurrences="8" value="tin_" /> + <ngram occurrences="8" value="te" /> + <ngram occurrences="8" value="t_" /> + <ngram occurrences="8" value="sus" /> + <ngram occurrences="8" value="sn" /> + <ngram occurrences="8" value="qa_ch" /> + <ngram occurrences="8" value="qa_c" /> + <ngram occurrences="8" value="pac" /> + <ngram occurrences="8" value="oq" /> + <ngram occurrences="8" value="o_" /> + <ngram occurrences="8" value="nqa_" /> + <ngram occurrences="8" value="nku_" /> + <ngram occurrences="8" value="nas" /> + <ngram occurrences="8" value="n_k" /> + <ngram occurrences="8" value="manch" /> + <ngram occurrences="8" value="manc" /> + <ngram occurrences="8" value="lo" /> + <ngram occurrences="8" value="kus" /> + <ngram occurrences="8" value="kar" /> + <ngram occurrences="8" value="ja" /> + <ngram occurrences="8" value="ios" /> + <ngram occurrences="8" value="inta" /> + <ngram occurrences="8" value="int" /> + <ngram occurrences="8" value="inch" /> + <ngram occurrences="8" value="el" /> + <ngram occurrences="8" value="e_" /> + <ngram occurrences="8" value="dios" /> + <ngram occurrences="8" value="ayta_" /> + <ngram occurrences="8" value="ayq" /> + <ngram occurrences="8" value="aypi" /> + <ngram occurrences="8" value="au" /> + <ngram occurrences="8" value="ataj_" /> + <ngram occurrences="8" value="ataj" /> + <ngram occurrences="8" value="ast" /> + <ngram occurrences="8" value="as_" /> + <ngram occurrences="8" value="arik" /> + <ngram occurrences="8" value="api" /> + <ngram occurrences="8" value="apa" /> + <ngram occurrences="8" value="alla" /> + <ngram occurrences="8" value="_tuku" /> + <ngram occurrences="8" value="_tuk" /> + <ngram occurrences="8" value="_ri" /> + <ngram occurrences="8" value="_qha" /> + <ngram occurrences="8" value="_may" /> + <ngram occurrences="8" value="_lla" /> + <ngram occurrences="8" value="_kar" /> + <ngram occurrences="8" value="_dios" /> + <ngram occurrences="8" value="_dio" /> + <ngram occurrences="8" value="_di" /> + <ngram occurrences="8" value="_d" /> + <ngram occurrences="7" value="yqa" /> + <ngram occurrences="7" value="ym" /> + <ngram occurrences="7" value="y_k" /> + <ngram occurrences="7" value="was" /> + <ngram occurrences="7" value="wan_" /> + <ngram occurrences="7" value="uspa" /> + <ngram occurrences="7" value="usp" /> + <ngram occurrences="7" value="uri" /> + <ngram occurrences="7" value="unc" /> + <ngram occurrences="7" value="sqan" /> + <ngram occurrences="7" value="rí" /> + <ngram occurrences="7" value="rqa_c" /> + <ngram occurrences="7" value="rin" /> + <ngram occurrences="7" value="rayku" /> + <ngram occurrences="7" value="rayk" /> + <ngram occurrences="7" value="qa_m" /> + <ngram occurrences="7" value="qa_ka" /> + <ngram occurrences="7" value="paq" /> + <ngram occurrences="7" value="paj" /> + <ngram occurrences="7" value="pach" /> + <ngram occurrences="7" value="on" /> + <ngram occurrences="7" value="nata" /> + <ngram occurrences="7" value="nat" /> +</ngrams> diff --git a/src/plugins/language/romanian.klp b/src/plugins/language/romanian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="841" value="_" /> + <ngram occurrences="548" value="a" /> + <ngram occurrences="470" value="i" /> + <ngram occurrences="453" value="e" /> + <ngram occurrences="277" value="t" /> + <ngram occurrences="270" value="r" /> + <ngram occurrences="238" value="n" /> + <ngram occurrences="223" value="u" /> + <ngram occurrences="217" value="e_" /> + <ngram occurrences="206" value="c" /> + <ngram occurrences="200" value="s" /> + <ngram occurrences="194" value="a_" /> + <ngram occurrences="190" value="o" /> + <ngram occurrences="176" value="l" /> + <ngram occurrences="144" value="i_" /> + <ngram occurrences="132" value="d" /> + <ngram occurrences="118" value="p" /> + <ngram occurrences="118" value="m" /> + <ngram occurrences="104" value="in" /> + <ngram occurrences="104" value="_c" /> + <ngram occurrences="93" value="_s" /> + <ngram occurrences="89" value="_d" /> + <ngram occurrences="87" value="ar" /> + <ngram occurrences="75" value="_a" /> + <ngram occurrences="72" value="re" /> + <ngram occurrences="68" value="_p" /> + <ngram occurrences="67" value="de" /> + <ngram occurrences="62" value="ra" /> + <ngram occurrences="62" value="at" /> + <ngram occurrences="60" value="f" /> + <ngram occurrences="59" value="_i" /> + <ngram occurrences="55" value="n_" /> + <ngram occurrences="54" value="ta" /> + <ngram occurrences="54" value="st" /> + <ngram occurrences="52" value="ca" /> + <ngram occurrences="51" value="u_" /> + <ngram occurrences="51" value="ti" /> + <ngram occurrences="50" value="te" /> + <ngram occurrences="49" value="_de" /> + <ngram occurrences="47" value="si" /> + <ngram occurrences="47" value="de_" /> + <ngram occurrences="46" value="un" /> + <ngram occurrences="46" value="t_" /> + <ngram occurrences="45" value="_m" /> + <ngram occurrences="44" value="_o" /> + <ngram occurrences="44" value="_in" /> + <ngram occurrences="42" value="nt" /> + <ngram occurrences="42" value="g" /> + <ngram occurrences="42" value="ce" /> + <ngram occurrences="41" value="ul" /> + <ngram occurrences="41" value="ri" /> + <ngram occurrences="41" value="_ca" /> + <ngram occurrences="40" value="or" /> + <ngram occurrences="40" value="b" /> + <ngram occurrences="39" value="ma" /> + <ngram occurrences="39" value="_de_" /> + <ngram occurrences="38" value="es" /> + <ngram occurrences="38" value="_f" /> + <ngram occurrences="37" value="la" /> + <ngram occurrences="37" value="are" /> + <ngram occurrences="36" value="ta_" /> + <ngram occurrences="35" value="l_" /> + <ngram occurrences="34" value="v" /> + <ngram occurrences="34" value="tr" /> + <ngram occurrences="34" value="_si" /> + <ngram occurrences="33" value="te_" /> + <ngram occurrences="33" value="re_" /> + <ngram occurrences="33" value="in_" /> + <ngram occurrences="33" value="el" /> + <ngram occurrences="33" value="ea" /> + <ngram occurrences="33" value="ci" /> + <ngram occurrences="32" value="se" /> + <ngram occurrences="32" value="_u" /> + <ngram occurrences="32" value="_t" /> + <ngram occurrences="31" value="_e" /> + <ngram occurrences="30" value="si_" /> + <ngram occurrences="30" value="oa" /> + <ngram occurrences="30" value="ia" /> + <ngram occurrences="30" value="_l" /> + <ngram occurrences="29" value="ni" /> + <ngram occurrences="29" value="cu" /> + <ngram occurrences="29" value="are_" /> + <ngram occurrences="28" value="_si_" /> + <ngram occurrences="27" value="z" /> + <ngram occurrences="27" value="e_c" /> + <ngram occurrences="27" value="as" /> + <ngram occurrences="26" value="ne" /> + <ngram occurrences="26" value="le" /> + <ngram occurrences="26" value="da" /> + <ngram occurrences="26" value="an" /> + <ngram occurrences="26" value="_un" /> + <ngram occurrences="26" value="_ma" /> + <ngram occurrences="25" value="pe" /> + <ngram occurrences="25" value="ic" /> + <ngram occurrences="25" value="ei" /> + <ngram occurrences="24" value="ra_" /> + <ngram occurrences="24" value="r_" /> + <ngram occurrences="24" value="pa" /> + <ngram occurrences="24" value="lu" /> + <ngram occurrences="24" value="li" /> + <ngram occurrences="24" value="int" /> + <ngram occurrences="24" value="er" /> + <ngram occurrences="24" value="e_a" /> + <ngram occurrences="24" value="ac" /> + <ngram occurrences="24" value="a_s" /> + <ngram occurrences="24" value="a_d" /> + <ngram occurrences="23" value="est" /> + <ngram occurrences="22" value="ste" /> + <ngram occurrences="22" value="la_" /> + <ngram occurrences="22" value="_n" /> + <ngram occurrences="21" value="sa" /> + <ngram occurrences="21" value="ii" /> + <ngram occurrences="21" value="i_c" /> + <ngram occurrences="21" value="car" /> + <ngram occurrences="21" value="_pe" /> + <ngram occurrences="20" value="to" /> + <ngram occurrences="20" value="o_" /> + <ngram occurrences="20" value="na" /> + <ngram occurrences="20" value="it" /> + <ngram occurrences="20" value="ie" /> + <ngram occurrences="20" value="e_i" /> + <ngram occurrences="20" value="e_d" /> + <ngram occurrences="20" value="al" /> + <ngram occurrences="20" value="_se" /> + <ngram occurrences="20" value="_in_" /> + <ngram occurrences="20" value="_cu" /> + <ngram occurrences="19" value="il" /> + <ngram occurrences="19" value="en" /> + <ngram occurrences="19" value="ei_" /> + <ngram occurrences="19" value="care_" /> + <ngram occurrences="19" value="care" /> + <ngram occurrences="19" value="ai" /> + <ngram occurrences="19" value="a_c" /> + <ngram occurrences="19" value="_o_" /> + <ngram occurrences="18" value="un_" /> + <ngram occurrences="18" value="ul_" /> + <ngram occurrences="18" value="ui" /> + <ngram occurrences="18" value="se_" /> + <ngram occurrences="18" value="ii_" /> + <ngram occurrences="18" value="i_p" /> + <ngram occurrences="18" value="este" /> + <ngram occurrences="18" value="e_s" /> + <ngram occurrences="18" value="cu_" /> + <ngram occurrences="18" value="au" /> + <ngram occurrences="18" value="ata" /> + <ngram occurrences="17" value="me" /> + <ngram occurrences="17" value="lo" /> + <ngram occurrences="17" value="le_" /> + <ngram occurrences="17" value="co" /> + <ngram occurrences="17" value="ata_" /> + <ngram occurrences="17" value="ara" /> + <ngram occurrences="17" value="am" /> + <ngram occurrences="17" value="_v" /> + <ngram occurrences="17" value="_cu_" /> + <ngram occurrences="17" value="_car" /> + <ngram occurrences="17" value="_b" /> + <ngram occurrences="16" value="ui_" /> + <ngram occurrences="16" value="ste_" /> + <ngram occurrences="16" value="ru" /> + <ngram occurrences="16" value="pr" /> + <ngram occurrences="16" value="pe_" /> + <ngram occurrences="16" value="om" /> + <ngram occurrences="16" value="fa" /> + <ngram occurrences="16" value="este_" /> + <ngram occurrences="16" value="ca_" /> + <ngram occurrences="16" value="a_p" /> + <ngram occurrences="16" value="_r" /> + <ngram occurrences="16" value="_ce" /> + <ngram occurrences="16" value="_care" /> + <ngram occurrences="15" value="rt" /> + <ngram occurrences="15" value="nu" /> + <ngram occurrences="15" value="na_" /> + <ngram occurrences="15" value="i_d" /> + <ngram occurrences="15" value="h" /> + <ngram occurrences="15" value="e_p" /> + <ngram occurrences="15" value="e_in" /> + <ngram occurrences="15" value="ap" /> + <ngram occurrences="15" value="a_de" /> + <ngram occurrences="15" value="a_a" /> + <ngram occurrences="15" value="_sa" /> + <ngram occurrences="14" value="ur" /> + <ngram occurrences="14" value="tu" /> + <ngram occurrences="14" value="tra" /> + <ngram occurrences="14" value="sa_" /> + <ngram occurrences="14" value="e_f" /> + <ngram occurrences="14" value="ara_" /> + <ngram occurrences="14" value="ace" /> + <ngram occurrences="14" value="a_i" /> + <ngram occurrences="14" value="_pe_" /> + <ngram occurrences="14" value="_da" /> + <ngram occurrences="13" value="zi" /> + <ngram occurrences="13" value="sc" /> + <ngram occurrences="13" value="pi" /> + <ngram occurrences="13" value="ot" /> + <ngram occurrences="13" value="nd" /> + <ngram occurrences="13" value="n_c" /> + <ngram occurrences="13" value="mu" /> + <ngram occurrences="13" value="mi" /> + <ngram occurrences="13" value="lui" /> + <ngram occurrences="13" value="is" /> + <ngram occurrences="13" value="io" /> + <ngram occurrences="13" value="ia_" /> + <ngram occurrences="13" value="e_o" /> + <ngram occurrences="13" value="e_m" /> + <ngram occurrences="13" value="e_ca" /> + <ngram occurrences="13" value="di" /> + <ngram occurrences="13" value="ce_" /> + <ngram occurrences="13" value="au_" /> + <ngram occurrences="13" value="a_o" /> + <ngram occurrences="13" value="_un_" /> + <ngram occurrences="13" value="_la" /> + <ngram occurrences="13" value="_ca_" /> + <ngram occurrences="12" value="ve" /> + <ngram occurrences="12" value="ut" /> + <ngram occurrences="12" value="po" /> + <ngram occurrences="12" value="os" /> + <ngram occurrences="12" value="or_" /> + <ngram occurrences="12" value="oar" /> + <ngram occurrences="12" value="ne_" /> + <ngram occurrences="12" value="lui_" /> + <ngram occurrences="12" value="ie_" /> + <ngram occurrences="12" value="i_s" /> + <ngram occurrences="12" value="fo" /> + <ngram occurrences="12" value="fe" /> + <ngram occurrences="12" value="ele" /> + <ngram occurrences="12" value="ea_" /> + <ngram occurrences="12" value="ci_" /> + <ngram occurrences="12" value="bi" /> + <ngram occurrences="12" value="at_" /> + <ngram occurrences="12" value="ai_" /> + <ngram occurrences="12" value="a_in" /> + <ngram occurrences="12" value="_se_" /> + <ngram occurrences="12" value="_pa" /> + <ngram occurrences="12" value="_fa" /> + <ngram occurrences="12" value="_co" /> + <ngram occurrences="12" value="_ac" /> + <ngram occurrences="12" value="_a_" /> + <ngram occurrences="11" value="um" /> + <ngram occurrences="11" value="tat" /> + <ngram occurrences="11" value="m_" /> + <ngram occurrences="11" value="ir" /> + <ngram occurrences="11" value="et" /> + <ngram occurrences="11" value="ent" /> + <ngram occurrences="11" value="ele_" /> + <ngram occurrences="11" value="e_si" /> + <ngram occurrences="11" value="c_" /> + <ngram occurrences="11" value="_nu" /> + <ngram occurrences="11" value="_la_" /> + <ngram occurrences="11" value="_int" /> + <ngram occurrences="11" value="_di" /> + <ngram occurrences="10" value="ulu" /> + <ngram occurrences="10" value="ti_" /> + <ngram occurrences="10" value="sta" /> + <ngram occurrences="10" value="pu" /> + <ngram occurrences="10" value="op" /> + <ngram occurrences="10" value="ol" /> + <ngram occurrences="10" value="nu_" /> + <ngram occurrences="10" value="ntr" /> + <ngram occurrences="10" value="mar" /> + <ngram occurrences="10" value="iu" /> + <ngram occurrences="10" value="im" /> + <ngram occurrences="10" value="ici" /> + <ngram occurrences="10" value="i_m" /> + <ngram occurrences="10" value="i_e" /> + <ngram occurrences="10" value="i_a" /> + <ngram occurrences="10" value="ga" /> + <ngram occurrences="10" value="ec" /> + <ngram occurrences="10" value="e_de" /> + <ngram occurrences="10" value="cel" /> + <ngram occurrences="10" value="a_l" /> + <ngram occurrences="10" value="_sa_" /> + <ngram occurrences="10" value="_fo" /> + <ngram occurrences="10" value="_este" /> + <ngram occurrences="10" value="_est" /> + <ngram occurrences="10" value="_es" /> + <ngram occurrences="9" value="ului" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="s_" /> + <ngram occurrences="9" value="par" /> + <ngram occurrences="9" value="ori" /> + <ngram occurrences="9" value="on" /> + <ngram occurrences="9" value="ns" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="it_" /> + <ngram occurrences="9" value="i_o" /> + <ngram occurrences="9" value="hi" /> + <ngram occurrences="9" value="e_ma" /> + <ngram occurrences="9" value="do" /> + <ngram occurrences="9" value="din" /> + <ngram occurrences="9" value="dat" /> + <ngram occurrences="9" value="ati" /> + <ngram occurrences="9" value="a_un" /> + <ngram occurrences="9" value="a_u" /> + <ngram occurrences="9" value="a_t" /> + <ngram occurrences="9" value="a_de_" /> + <ngram occurrences="9" value="_st" /> + <ngram occurrences="9" value="_po" /> + <ngram occurrences="9" value="_nu_" /> + <ngram occurrences="9" value="_lu" /> + <ngram occurrences="9" value="_g" /> + <ngram occurrences="9" value="_din" /> + <ngram occurrences="9" value="_ar" /> + <ngram occurrences="8" value="une" /> + <ngram occurrences="8" value="ului_" /> + <ngram occurrences="8" value="tru" /> + <ngram occurrences="8" value="tie" /> + <ngram occurrences="8" value="t_d" /> + <ngram occurrences="8" value="str" /> + <ngram occurrences="8" value="ro" /> + <ngram occurrences="8" value="ost" /> + <ngram occurrences="8" value="oc" /> + <ngram occurrences="8" value="nic" /> + <ngram occurrences="8" value="ng" /> + <ngram occurrences="8" value="nc" /> + <ngram occurrences="8" value="mul" /> + <ngram occurrences="8" value="mai_" /> + <ngram occurrences="8" value="mai" /> + <ngram occurrences="8" value="ma_" /> + <ngram occurrences="8" value="lor_" /> + <ngram occurrences="8" value="lor" /> + <ngram occurrences="8" value="ini" /> + <ngram occurrences="8" value="ine" /> + <ngram occurrences="8" value="ind" /> + <ngram occurrences="8" value="i_ma" /> + <ngram occurrences="8" value="gi" /> + <ngram occurrences="8" value="fi" /> + <ngram occurrences="8" value="em" /> + <ngram occurrences="8" value="e_v" /> + <ngram occurrences="8" value="e_si_" /> + <ngram occurrences="8" value="e_de_" /> + <ngram occurrences="8" value="da_" /> + <ngram occurrences="8" value="ate" /> + <ngram occurrences="8" value="ad" /> + <ngram occurrences="8" value="a_si" /> + <ngram occurrences="8" value="a_f" /> + <ngram occurrences="8" value="a_e" /> + <ngram occurrences="8" value="_tr" /> + <ngram occurrences="8" value="_pr" /> + <ngram occurrences="8" value="_or" /> + <ngram occurrences="8" value="_mar" /> + <ngram occurrences="8" value="_e_" /> + <ngram occurrences="8" value="_do" /> + <ngram occurrences="8" value="_ace" /> + <ngram occurrences="7" value="una" /> + <ngram occurrences="7" value="u_s" /> + <ngram occurrences="7" value="tul" /> + <ngram occurrences="7" value="tot" /> + <ngram occurrences="7" value="tor" /> + <ngram occurrences="7" value="tin" /> + <ngram occurrences="7" value="t_c" /> + <ngram occurrences="7" value="sin" /> + <ngram occurrences="7" value="si_c" /> + <ngram occurrences="7" value="rm" /> + <ngram occurrences="7" value="ri_" /> + <ngram occurrences="7" value="res" /> + <ngram occurrences="7" value="rea" /> + <ngram occurrences="7" value="ran" /> + <ngram occurrences="7" value="pri" /> + <ngram occurrences="7" value="pl" /> + <ngram occurrences="7" value="pin" /> + <ngram occurrences="7" value="nta" /> + <ngram occurrences="7" value="nde" /> + <ngram occurrences="7" value="n_ca" /> + <ngram occurrences="7" value="mp" /> + <ngram occurrences="7" value="min" /> + <ngram occurrences="7" value="lt" /> + <ngram occurrences="7" value="j" /> + <ngram occurrences="7" value="iv" /> + <ngram occurrences="7" value="ina" /> + <ngram occurrences="7" value="in_c" /> + <ngram occurrences="7" value="ilo" /> + <ngram occurrences="7" value="i_u" /> + <ngram occurrences="7" value="i_i" /> + <ngram occurrences="7" value="i_de" /> + <ngram occurrences="7" value="far" /> + <ngram occurrences="7" value="esc" /> + <ngram occurrences="7" value="e_o_" /> + <ngram occurrences="7" value="de_f" /> + <ngram occurrences="7" value="de_a" /> + <ngram occurrences="7" value="d_" /> + <ngram occurrences="7" value="cr" /> + <ngram occurrences="7" value="ch" /> + <ngram occurrences="7" value="az" /> + <ngram occurrences="7" value="ator" /> + <ngram occurrences="7" value="ato" /> + <ngram occurrences="7" value="ast" /> + <ngram occurrences="7" value="art" /> + <ngram occurrences="7" value="ar_" /> + <ngram occurrences="7" value="ani" /> + <ngram occurrences="7" value="a_si_" /> + <ngram occurrences="7" value="a_pe" /> + <ngram occurrences="7" value="a_n" /> + <ngram occurrences="7" value="_to" /> + <ngram occurrences="7" value="_mai_" /> + <ngram occurrences="7" value="_mai" /> + <ngram occurrences="7" value="_de_f" /> + <ngram occurrences="7" value="_ci" /> + <ngram occurrences="6" value="vi" /> + <ngram occurrences="6" value="up" /> + <ngram occurrences="6" value="tre" /> +</ngrams> diff --git a/src/plugins/language/rumantsch.klp b/src/plugins/language/rumantsch.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="823" value="_" /> + <ngram occurrences="504" value="a" /> + <ngram occurrences="350" value="e" /> + <ngram occurrences="332" value="i" /> + <ngram occurrences="318" value="s" /> + <ngram occurrences="298" value="n" /> + <ngram occurrences="247" value="r" /> + <ngram occurrences="209" value="a_" /> + <ngram occurrences="193" value="t" /> + <ngram occurrences="191" value="l" /> + <ngram occurrences="177" value="u" /> + <ngram occurrences="164" value="c" /> + <ngram occurrences="152" value="d" /> + <ngram occurrences="132" value="o" /> + <ngram occurrences="123" value="s_" /> + <ngram occurrences="115" value="m" /> + <ngram occurrences="113" value="g" /> + <ngram occurrences="103" value="h" /> + <ngram occurrences="98" value="n_" /> + <ngram occurrences="87" value="p" /> + <ngram occurrences="84" value="_e" /> + <ngram occurrences="82" value="_s" /> + <ngram occurrences="81" value="er" /> + <ngram occurrences="77" value="_d" /> + <ngram occurrences="75" value="v" /> + <ngram occurrences="73" value="ch" /> + <ngram occurrences="72" value="r_" /> + <ngram occurrences="64" value="in" /> + <ngram occurrences="62" value="en" /> + <ngram occurrences="61" value="_c" /> + <ngram occurrences="60" value="sc" /> + <ngram occurrences="60" value="l_" /> + <ngram occurrences="60" value="da" /> + <ngram occurrences="57" value="f" /> + <ngram occurrences="52" value="_p" /> + <ngram occurrences="51" value="_i" /> + <ngram occurrences="49" value="_m" /> + <ngram occurrences="49" value="_da" /> + <ngram occurrences="49" value="_a" /> + <ngram occurrences="48" value="ra" /> + <ngram occurrences="46" value="an" /> + <ngram occurrences="45" value="sch" /> + <ngram occurrences="44" value="_f" /> + <ngram occurrences="43" value="i_" /> + <ngram occurrences="43" value="ar" /> + <ngram occurrences="41" value="z" /> + <ngram occurrences="41" value="ma" /> + <ngram occurrences="41" value="er_" /> + <ngram occurrences="41" value="ai" /> + <ngram occurrences="40" value="la" /> + <ngram occurrences="40" value="da_" /> + <ngram occurrences="39" value="un" /> + <ngram occurrences="39" value="ta" /> + <ngram occurrences="39" value="na" /> + <ngram occurrences="37" value="nt" /> + <ngram occurrences="35" value="_t" /> + <ngram occurrences="35" value="_l" /> + <ngram occurrences="35" value="_da_" /> + <ngram occurrences="34" value="t_" /> + <ngram occurrences="33" value="b" /> + <ngram occurrences="33" value="as" /> + <ngram occurrences="32" value="e_" /> + <ngram occurrences="29" value="es" /> + <ngram occurrences="28" value="il" /> + <ngram occurrences="28" value="ia" /> + <ngram occurrences="28" value="d_" /> + <ngram occurrences="28" value="al" /> + <ngram occurrences="27" value="va" /> + <ngram occurrences="27" value="re" /> + <ngram occurrences="27" value="is" /> + <ngram occurrences="26" value="st" /> + <ngram occurrences="26" value="_v" /> + <ngram occurrences="26" value="_n" /> + <ngram occurrences="25" value="pe" /> + <ngram occurrences="25" value="gl" /> + <ngram occurrences="25" value="el" /> + <ngram occurrences="25" value="ei" /> + <ngram occurrences="25" value="de" /> + <ngram occurrences="25" value="cu" /> + <ngram occurrences="24" value="un_" /> + <ngram occurrences="24" value="sa" /> + <ngram occurrences="24" value="or" /> + <ngram occurrences="24" value="he" /> + <ngram occurrences="24" value="ha" /> + <ngram occurrences="24" value="di" /> + <ngram occurrences="24" value="_sc" /> + <ngram occurrences="24" value="_g" /> + <ngram occurrences="23" value="ü" /> + <ngram occurrences="23" value="ve" /> + <ngram occurrences="23" value="te" /> + <ngram occurrences="23" value="as_" /> + <ngram occurrences="23" value="_in" /> + <ngram occurrences="22" value="ts" /> + <ngram occurrences="22" value="ss" /> + <ngram occurrences="22" value="ad" /> + <ngram occurrences="22" value="_o" /> + <ngram occurrences="21" value="tg" /> + <ngram occurrences="21" value="ra_" /> + <ngram occurrences="21" value="per" /> + <ngram occurrences="21" value="on" /> + <ngram occurrences="21" value="g_" /> + <ngram occurrences="21" value="ain" /> + <ngram occurrences="20" value="ur" /> + <ngram occurrences="20" value="u_" /> + <ngram occurrences="20" value="rt" /> + <ngram occurrences="20" value="ns" /> + <ngram occurrences="20" value="ig" /> + <ngram occurrences="20" value="en_" /> + <ngram occurrences="20" value="_en" /> + <ngram occurrences="19" value="qu" /> + <ngram occurrences="19" value="q" /> + <ngram occurrences="19" value="ng" /> + <ngram occurrences="19" value="na_" /> + <ngram occurrences="19" value="in_" /> + <ngram occurrences="19" value="h_" /> + <ngram occurrences="18" value="ti" /> + <ngram occurrences="18" value="rs" /> + <ngram occurrences="18" value="o_" /> + <ngram occurrences="18" value="li" /> + <ngram occurrences="18" value="iv" /> + <ngram occurrences="18" value="ir" /> + <ngram occurrences="18" value="che" /> + <ngram occurrences="18" value="ch_" /> + <ngram occurrences="18" value="a_e" /> + <ngram occurrences="18" value="a_c" /> + <ngram occurrences="18" value="_h" /> + <ngram occurrences="18" value="_e_" /> + <ngram occurrences="18" value="_ch" /> + <ngram occurrences="18" value="_b" /> + <ngram occurrences="17" value="to" /> + <ngram occurrences="17" value="se" /> + <ngram occurrences="17" value="s_e" /> + <ngram occurrences="17" value="mi" /> + <ngram occurrences="17" value="la_" /> + <ngram occurrences="17" value="ie" /> + <ngram occurrences="17" value="gi" /> + <ngram occurrences="17" value="eg" /> + <ngram occurrences="17" value="_r" /> + <ngram occurrences="17" value="_qu" /> + <ngram occurrences="17" value="_q" /> + <ngram occurrences="17" value="_pe" /> + <ngram occurrences="17" value="_ma" /> + <ngram occurrences="17" value="_cu" /> + <ngram occurrences="16" value="us" /> + <ngram occurrences="16" value="ta_" /> + <ngram occurrences="16" value="ri" /> + <ngram occurrences="16" value="pa" /> + <ngram occurrences="16" value="ll" /> + <ngram occurrences="16" value="iu" /> + <ngram occurrences="16" value="ha_" /> + <ngram occurrences="16" value="et" /> + <ngram occurrences="16" value="el_" /> + <ngram occurrences="16" value="_u" /> + <ngram occurrences="16" value="_per" /> + <ngram occurrences="15" value="za" /> + <ngram occurrences="15" value="vi" /> + <ngram occurrences="15" value="ns_" /> + <ngram occurrences="15" value="me" /> + <ngram occurrences="15" value="ls_" /> + <ngram occurrences="15" value="ls" /> + <ngram occurrences="15" value="igl" /> + <ngram occurrences="15" value="ia_" /> + <ngram occurrences="15" value="fi" /> + <ngram occurrences="15" value="ent" /> + <ngram occurrences="15" value="ei_" /> + <ngram occurrences="15" value="co" /> + <ngram occurrences="15" value="cha" /> + <ngram occurrences="15" value="a_s" /> + <ngram occurrences="15" value="a_m" /> + <ngram occurrences="15" value="a_f" /> + <ngram occurrences="15" value="_il" /> + <ngram occurrences="14" value="sa_" /> + <ngram occurrences="14" value="s_d" /> + <ngram occurrences="14" value="nu" /> + <ngram occurrences="14" value="ni" /> + <ngram occurrences="14" value="n_m" /> + <ngram occurrences="14" value="mai" /> + <ngram occurrences="14" value="ic" /> + <ngram occurrences="14" value="hi" /> + <ngram occurrences="14" value="gn" /> + <ngram occurrences="14" value="ga" /> + <ngram occurrences="14" value="at" /> + <ngram occurrences="14" value="a_p" /> + <ngram occurrences="13" value="va_" /> + <ngram occurrences="13" value="su" /> + <ngram occurrences="13" value="sta" /> + <ngram occurrences="13" value="pr" /> + <ngram occurrences="13" value="per_" /> + <ngram occurrences="13" value="nd" /> + <ngram occurrences="13" value="it" /> + <ngram occurrences="13" value="int" /> + <ngram occurrences="13" value="ed" /> + <ngram occurrences="13" value="ca" /> + <ngram occurrences="13" value="an_" /> + <ngram occurrences="13" value="a_l" /> + <ngram occurrences="13" value="_per_" /> + <ngram occurrences="13" value="_mi" /> + <ngram occurrences="13" value="_la" /> + <ngram occurrences="12" value="uo" /> + <ngram occurrences="12" value="ue" /> + <ngram occurrences="12" value="ts_" /> + <ngram occurrences="12" value="si" /> + <ngram occurrences="12" value="rt_" /> + <ngram occurrences="12" value="que" /> + <ngram occurrences="12" value="ot" /> + <ngram occurrences="12" value="nz" /> + <ngram occurrences="12" value="mo" /> + <ngram occurrences="12" value="lu" /> + <ngram occurrences="12" value="il_" /> + <ngram occurrences="12" value="am" /> + <ngram occurrences="12" value="a_t" /> + <ngram occurrences="12" value="a_d" /> + <ngram occurrences="12" value="_sch" /> + <ngram occurrences="12" value="_fi" /> + <ngram occurrences="12" value="_di" /> + <ngram occurrences="11" value="ut" /> + <ngram occurrences="11" value="um" /> + <ngram occurrences="11" value="scha" /> + <ngram occurrences="11" value="s_s" /> + <ngram occurrences="11" value="s_a" /> + <ngram occurrences="11" value="ro" /> + <ngram occurrences="11" value="lla" /> + <ngram occurrences="11" value="le" /> + <ngram occurrences="11" value="iss" /> + <ngram occurrences="11" value="gl_" /> + <ngram occurrences="11" value="fa" /> + <ngram occurrences="11" value="era" /> + <ngram occurrences="11" value="chi" /> + <ngram occurrences="11" value="av" /> + <ngram occurrences="11" value="au" /> + <ngram occurrences="11" value="ar_" /> + <ngram occurrences="11" value="a_i" /> + <ngram occurrences="11" value="_ve" /> + <ngram occurrences="11" value="_que" /> + <ngram occurrences="11" value="_pa" /> + <ngram occurrences="11" value="_nu" /> + <ngram occurrences="11" value="_in_" /> + <ngram occurrences="10" value="ün" /> + <ngram occurrences="10" value="zi" /> + <ngram occurrences="10" value="za_" /> + <ngram occurrences="10" value="x" /> + <ngram occurrences="10" value="ter" /> + <ngram occurrences="10" value="s_da" /> + <ngram occurrences="10" value="s_c" /> + <ngram occurrences="10" value="pi" /> + <ngram occurrences="10" value="nza" /> + <ngram occurrences="10" value="ng_" /> + <ngram occurrences="10" value="mp" /> + <ngram occurrences="10" value="man" /> + <ngram occurrences="10" value="main" /> + <ngram occurrences="10" value="lla_" /> + <ngram occurrences="10" value="iun" /> + <ngram occurrences="10" value="igl_" /> + <ngram occurrences="10" value="gia" /> + <ngram occurrences="10" value="ge" /> + <ngram occurrences="10" value="fe" /> + <ngram occurrences="10" value="ev" /> + <ngram occurrences="10" value="esc" /> + <ngram occurrences="10" value="cl" /> + <ngram occurrences="10" value="be" /> + <ngram occurrences="10" value="a_v" /> + <ngram occurrences="10" value="a_g" /> + <ngram occurrences="10" value="_l_" /> + <ngram occurrences="10" value="_il_" /> + <ngram occurrences="10" value="_de" /> + <ngram occurrences="9" value="tsch" /> + <ngram occurrences="9" value="tsc" /> + <ngram occurrences="9" value="sch_" /> + <ngram occurrences="9" value="rs_" /> + <ngram occurrences="9" value="os" /> + <ngram occurrences="9" value="om" /> + <ngram occurrences="9" value="nta" /> + <ngram occurrences="9" value="n_e" /> + <ngram occurrences="9" value="n_d" /> + <ngram occurrences="9" value="n_a" /> + <ngram occurrences="9" value="m_" /> + <ngram occurrences="9" value="las" /> + <ngram occurrences="9" value="l_s" /> + <ngram occurrences="9" value="ir_" /> + <ngram occurrences="9" value="ing" /> + <ngram occurrences="9" value="i_d" /> + <ngram occurrences="9" value="gli" /> + <ngram occurrences="9" value="esch" /> + <ngram occurrences="9" value="em" /> + <ngram occurrences="9" value="des" /> + <ngram occurrences="9" value="cun" /> + <ngram occurrences="9" value="c_" /> + <ngram occurrences="9" value="ama" /> + <ngram occurrences="9" value="al_" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="_su" /> + <ngram occurrences="9" value="_st" /> + <ngram occurrences="9" value="_me" /> + <ngram occurrences="9" value="_ha_" /> + <ngram occurrences="9" value="_ha" /> + <ngram occurrences="9" value="_fa" /> + <ngram occurrences="9" value="_en_" /> + <ngram occurrences="9" value="_an" /> + <ngram occurrences="8" value="ver" /> + <ngram occurrences="8" value="tg_" /> + <ngram occurrences="8" value="ssa" /> + <ngram occurrences="8" value="sp" /> + <ngram occurrences="8" value="schi" /> + <ngram occurrences="8" value="s_e_" /> + <ngram occurrences="8" value="rm" /> + <ngram occurrences="8" value="r_a" /> + <ngram occurrences="8" value="pl" /> + <ngram occurrences="8" value="par" /> + <ngram occurrences="8" value="no" /> + <ngram occurrences="8" value="nc" /> + <ngram occurrences="8" value="n_s" /> + <ngram occurrences="8" value="n_p" /> + <ngram occurrences="8" value="n_i" /> + <ngram occurrences="8" value="min" /> + <ngram occurrences="8" value="ier" /> + <ngram occurrences="8" value="eu" /> + <ngram occurrences="8" value="ed_" /> + <ngram occurrences="8" value="desc" /> + <ngram occurrences="8" value="d_e" /> + <ngram occurrences="8" value="all" /> + <ngram occurrences="8" value="aint" /> + <ngram occurrences="8" value="ad_" /> + <ngram occurrences="8" value="_ün" /> + <ngram occurrences="8" value="_ü" /> + <ngram occurrences="8" value="_vi" /> + <ngram occurrences="8" value="_tg" /> + <ngram occurrences="8" value="_se" /> + <ngram occurrences="8" value="_sa" /> + <ngram occurrences="8" value="_gi" /> + <ngram occurrences="8" value="_fe" /> + <ngram occurrences="8" value="_er" /> + <ngram occurrences="8" value="_ed_" /> + <ngram occurrences="8" value="_ed" /> + <ngram occurrences="8" value="_cun" /> + <ngram occurrences="8" value="_co" /> + <ngram occurrences="7" value="vai" /> + <ngram occurrences="7" value="us_" /> + <ngram occurrences="7" value="ura" /> + <ngram occurrences="7" value="uel" /> + <ngram occurrences="7" value="sta_" /> + <ngram occurrences="7" value="sen" /> + <ngram occurrences="7" value="sche" /> + <ngram occurrences="7" value="s_p" /> + <ngram occurrences="7" value="s_da_" /> + <ngram occurrences="7" value="ran" /> + <ngram occurrences="7" value="r_d" /> + <ngram occurrences="7" value="quel" /> + <ngram occurrences="7" value="ors" /> + <ngram occurrences="7" value="nza_" /> + <ngram occurrences="7" value="nts" /> + <ngram occurrences="7" value="nte" /> + <ngram occurrences="7" value="nt_" /> + <ngram occurrences="7" value="nas" /> + <ngram occurrences="7" value="n_ma" /> + <ngram occurrences="7" value="n_da" /> + <ngram occurrences="7" value="lo" /> + <ngram occurrences="7" value="las_" /> + <ngram occurrences="7" value="lar" /> + <ngram occurrences="7" value="l_c" /> + <ngram occurrences="7" value="ins" /> + <ngram occurrences="7" value="ing_" /> + <ngram occurrences="7" value="ina" /> + <ngram occurrences="7" value="im" /> + <ngram occurrences="7" value="id" /> + <ngram occurrences="7" value="gn_" /> + <ngram occurrences="7" value="fo" /> + <ngram occurrences="7" value="eva" /> + <ngram occurrences="7" value="ert" /> + <ngram occurrences="7" value="end" /> + <ngram occurrences="7" value="di_" /> + <ngram occurrences="7" value="desch" /> + <ngram occurrences="7" value="cha_" /> + <ngram occurrences="7" value="az" /> + <ngram occurrences="7" value="ava" /> + <ngram occurrences="7" value="ag" /> + <ngram occurrences="7" value="ac" /> + <ngram occurrences="7" value="a_ma" /> + <ngram occurrences="7" value="a_da" /> + <ngram occurrences="7" value="a_cu" /> + <ngram occurrences="7" value="_te" /> + <ngram occurrences="7" value="_re" /> + <ngram occurrences="7" value="_quel" /> + <ngram occurrences="7" value="_pr" /> + <ngram occurrences="7" value="_or" /> + <ngram occurrences="7" value="_na" /> + <ngram occurrences="7" value="_mo" /> + <ngram occurrences="7" value="_lu" /> + <ngram occurrences="7" value="_ins" /> + <ngram occurrences="7" value="_fo" /> + <ngram occurrences="7" value="_ei_" /> + <ngram occurrences="7" value="_ei" /> + <ngram occurrences="7" value="_cl" /> + <ngram occurrences="7" value="_ch_" /> + <ngram occurrences="6" value="è" /> + <ngram occurrences="6" value="ziun" /> + <ngram occurrences="6" value="ziu" /> + <ngram occurrences="6" value="z_" /> + <ngram occurrences="6" value="vair" /> + <ngram occurrences="6" value="ura_" /> + <ngram occurrences="6" value="ur_" /> +</ngrams> diff --git a/src/plugins/language/russian.klp b/src/plugins/language/russian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="873" value="_" /> + <ngram occurrences="533" value="ï" /> + <ngram occurrences="411" value="å" /> + <ngram occurrences="385" value="á" /> + <ngram occurrences="324" value="ô" /> + <ngram occurrences="302" value="é" /> + <ngram occurrences="296" value="î" /> + <ngram occurrences="243" value="ó" /> + <ngram occurrences="206" value="ò" /> + <ngram occurrences="188" value="ì" /> + <ngram occurrences="160" value="ï_" /> + <ngram occurrences="150" value="ë" /> + <ngram occurrences="149" value="í" /> + <ngram occurrences="144" value="ð" /> + <ngram occurrences="119" value="ä" /> + <ngram occurrences="118" value="á_" /> + <ngram occurrences="116" value="_ð" /> + <ngram occurrences="100" value="å_" /> + <ngram occurrences="98" value="ç" /> + <ngram occurrences="96" value="õ" /> + <ngram occurrences="86" value="_ó" /> + <ngram occurrences="81" value="ù" /> + <ngram occurrences="80" value="é_" /> + <ngram occurrences="79" value="ø" /> + <ngram occurrences="76" value="þ" /> + <ngram occurrences="75" value="ôï" /> + <ngram occurrences="75" value="ñ" /> + <ngram occurrences="74" value="_ï" /> + <ngram occurrences="71" value="óô" /> + <ngram occurrences="67" value="_î" /> + <ngram occurrences="63" value="â" /> + <ngram occurrences="63" value="_á" /> + <ngram occurrences="59" value="ú" /> + <ngram occurrences="56" value="òá" /> + <ngram occurrences="55" value="îï" /> + <ngram occurrences="55" value="ê" /> + <ngram occurrences="53" value="ðï" /> + <ngram occurrences="52" value="îá" /> + <ngram occurrences="51" value="ô_" /> + <ngram occurrences="49" value="ø_" /> + <ngram occurrences="49" value="ôá" /> + <ngram occurrences="49" value="ñ_" /> + <ngram occurrences="47" value="ëï" /> + <ngram occurrences="47" value="_ô" /> + <ngram occurrences="47" value="_í" /> + <ngram occurrences="46" value="òï" /> + <ngram occurrences="45" value="îå" /> + <ngram occurrences="45" value="_ðï" /> + <ngram occurrences="45" value="_é" /> + <ngram occurrences="44" value="ö" /> + <ngram occurrences="44" value="í_" /> + <ngram occurrences="44" value="ê_" /> + <ngram occurrences="44" value="çï" /> + <ngram occurrences="42" value="ïì" /> + <ngram occurrences="41" value="åî" /> + <ngram occurrences="40" value="è" /> + <ngram occurrences="39" value="ïó" /> + <ngram occurrences="39" value="îé" /> + <ngram occurrences="39" value="åô" /> + <ngram occurrences="39" value="áî" /> + <ngram occurrences="39" value="_ä" /> + <ngram occurrences="38" value="ôå" /> + <ngram occurrences="37" value="ïç" /> + <ngram occurrences="36" value="ðò" /> + <ngram occurrences="36" value="áô" /> + <ngram occurrences="35" value="åó" /> + <ngram occurrences="34" value="ìå" /> + <ngram occurrences="34" value="åò" /> + <ngram occurrences="34" value="_ðò" /> + <ngram occurrences="34" value="_å" /> + <ngram occurrences="32" value="ïí" /> + <ngram occurrences="32" value="íï" /> + <ngram occurrences="32" value="ìï" /> + <ngram occurrences="32" value="áì" /> + <ngram occurrences="31" value="òå" /> + <ngram occurrences="31" value="éî" /> + <ngram occurrences="31" value="åì" /> + <ngram occurrences="30" value="ôï_" /> + <ngram occurrences="30" value="ïî" /> + <ngram occurrences="29" value="þå" /> + <ngram occurrences="29" value="óë" /> + <ngram occurrences="29" value="ïä" /> + <ngram occurrences="29" value="ìø" /> + <ngram occurrences="29" value="çï_" /> + <ngram occurrences="29" value="_ë" /> + <ngram occurrences="28" value="îï_" /> + <ngram occurrences="28" value="è_" /> + <ngram occurrences="28" value="_þ" /> + <ngram occurrences="27" value="ôø" /> + <ngram occurrences="27" value="ï_ó" /> + <ngram occurrences="26" value="ôø_" /> + <ngram occurrences="26" value="òé" /> + <ngram occurrences="26" value="_â" /> + <ngram occurrences="25" value="îá_" /> + <ngram occurrences="25" value="äï" /> + <ngram occurrences="25" value="_ù" /> + <ngram occurrences="25" value="_ò" /> + <ngram occurrences="24" value="õ_" /> + <ngram occurrences="24" value="ë_" /> + <ngram occurrences="24" value="ã" /> + <ngram occurrences="24" value="_îá" /> + <ngram occurrences="23" value="öå" /> + <ngram occurrences="23" value="óå" /> + <ngram occurrences="23" value="ïô" /> + <ngram occurrences="23" value="ï_ð" /> + <ngram occurrences="23" value="íå" /> + <ngram occurrences="23" value="ëá" /> + <ngram occurrences="22" value="ïçï" /> + <ngram occurrences="22" value="ìé" /> + <ngram occurrences="22" value="éå" /> + <ngram occurrences="22" value="æ" /> + <ngram occurrences="22" value="åí" /> + <ngram occurrences="22" value="äå" /> + <ngram occurrences="22" value="_îå" /> + <ngram occurrences="22" value="_ì" /> + <ngram occurrences="21" value="ù_" /> + <ngram occurrences="21" value="åô_" /> + <ngram occurrences="21" value="_ç" /> + <ngram occurrences="21" value="_á_" /> + <ngram occurrences="20" value="ý" /> + <ngram occurrences="20" value="ðå" /> + <ngram occurrences="20" value="ïò" /> + <ngram occurrences="20" value="ïê" /> + <ngram occurrences="20" value="à" /> + <ngram occurrences="19" value="þôï" /> + <ngram occurrences="19" value="þô" /> + <ngram occurrences="19" value="ôé" /> + <ngram occurrences="19" value="ïçï_" /> + <ngram occurrences="19" value="îù" /> + <ngram occurrences="19" value="ìá" /> + <ngram occurrences="19" value="_þôï" /> + <ngram occurrences="19" value="_þô" /> + <ngram occurrences="19" value="_ôï" /> + <ngram occurrences="19" value="_íï" /> + <ngram occurrences="19" value="_é_" /> + <ngram occurrences="18" value="ó_" /> + <ngram occurrences="18" value="ðá" /> + <ngram occurrences="18" value="äá" /> + <ngram occurrences="18" value="áí" /> + <ngram occurrences="18" value="áë" /> + <ngram occurrences="18" value="_õ" /> + <ngram occurrences="18" value="_óô" /> + <ngram occurrences="17" value="ü" /> + <ngram occurrences="17" value="û" /> + <ngram occurrences="17" value="ôò" /> + <ngram occurrences="17" value="óï" /> + <ngram occurrences="17" value="ðòï" /> + <ngram occurrences="17" value="ïê_" /> + <ngram occurrences="17" value="íé" /> + <ngram occurrences="17" value="éô" /> + <ngram occurrences="17" value="_ü" /> + <ngram occurrences="16" value="þôï_" /> + <ngram occurrences="16" value="þá" /> + <ngram occurrences="16" value="úá" /> + <ngram occurrences="16" value="ëé" /> + <ngram occurrences="16" value="éì" /> + <ngram occurrences="16" value="åä" /> + <ngram occurrences="16" value="áò" /> + <ngram occurrences="16" value="_þôï_" /> + <ngram occurrences="16" value="_ðá" /> + <ngram occurrences="15" value="óôá" /> + <ngram occurrences="15" value="óô_" /> + <ngram occurrences="15" value="óì" /> + <ngram occurrences="15" value="ìï_" /> + <ngram occurrences="15" value="ì_" /> + <ngram occurrences="15" value="éé_" /> + <ngram occurrences="15" value="éé" /> + <ngram occurrences="15" value="éå_" /> + <ngram occurrences="15" value="åóô" /> + <ngram occurrences="15" value="åç" /> + <ngram occurrences="15" value="âù" /> + <ngram occurrences="15" value="á_ð" /> + <ngram occurrences="15" value="_óå" /> + <ngram occurrences="15" value="_ðòï" /> + <ngram occurrences="15" value="_äï" /> + <ngram occurrences="14" value="óëï" /> + <ngram occurrences="14" value="éó" /> + <ngram occurrences="14" value="éí" /> + <ngram occurrences="14" value="éè" /> + <ngram occurrences="14" value="çé" /> + <ngram occurrences="14" value="çá" /> + <ngram occurrences="14" value="å_ó" /> + <ngram occurrences="14" value="âï" /> + <ngram occurrences="14" value="áú" /> + <ngram occurrences="14" value="áó" /> + <ngram occurrences="14" value="_ôá" /> + <ngram occurrences="14" value="_îá_" /> + <ngram occurrences="13" value="üô" /> + <ngram occurrences="13" value="óñ" /> + <ngram occurrences="13" value="ïþ" /> + <ngram occurrences="13" value="ïö" /> + <ngram occurrences="13" value="ïí_" /> + <ngram occurrences="13" value="îå_" /> + <ngram occurrences="13" value="ëô" /> + <ngram occurrences="13" value="åë" /> + <ngram occurrences="13" value="åê" /> + <ngram occurrences="13" value="á_î" /> + <ngram occurrences="13" value="_üô" /> + <ngram occurrences="13" value="_ú" /> + <ngram occurrences="13" value="_òá" /> + <ngram occurrences="13" value="_ëï" /> + <ngram occurrences="12" value="ôáë" /> + <ngram occurrences="12" value="óñ_" /> + <ngram occurrences="12" value="òï_" /> + <ngram occurrences="12" value="òá_" /> + <ngram occurrences="12" value="ïóô" /> + <ngram occurrences="12" value="ïâ" /> + <ngram occurrences="12" value="îø" /> + <ngram occurrences="12" value="íá" /> + <ngram occurrences="12" value="ëï_" /> + <ngram occurrences="12" value="éë" /> + <ngram occurrences="12" value="éè_" /> + <ngram occurrences="12" value="åú" /> + <ngram occurrences="12" value="äï_" /> + <ngram occurrences="12" value="á_ó" /> + <ngram occurrences="12" value="á_ï" /> + <ngram occurrences="12" value="_ôáë" /> + <ngram occurrences="12" value="_ðå" /> + <ngram occurrences="11" value="ùè_" /> + <ngram occurrences="11" value="ùè" /> + <ngram occurrences="11" value="óôï" /> + <ngram occurrences="11" value="òõ" /> + <ngram occurrences="11" value="ñô" /> + <ngram occurrences="11" value="ðåò" /> + <ngram occurrences="11" value="ïìø" /> + <ngram occurrences="11" value="ïë" /> + <ngram occurrences="11" value="ï_ðï" /> + <ngram occurrences="11" value="îïç" /> + <ngram occurrences="11" value="ìñ" /> + <ngram occurrences="11" value="ìé_" /> + <ngram occurrences="11" value="é_î" /> + <ngram occurrences="11" value="åîé" /> + <ngram occurrences="11" value="åê_" /> + <ngram occurrences="11" value="åçï" /> + <ngram occurrences="11" value="åå" /> + <ngram occurrences="11" value="å_ð" /> + <ngram occurrences="11" value="å_ï" /> + <ngram occurrences="11" value="äé" /> + <ngram occurrences="11" value="ãé" /> + <ngram occurrences="11" value="áòá" /> + <ngram occurrences="11" value="áñ_" /> + <ngram occurrences="11" value="áñ" /> + <ngram occurrences="11" value="áìø" /> + <ngram occurrences="11" value="_úá" /> + <ngram occurrences="11" value="_íå" /> + <ngram occurrences="10" value="þåî" /> + <ngram occurrences="10" value="ú_" /> + <ngram occurrences="10" value="øî" /> + <ngram occurrences="10" value="õþ" /> + <ngram occurrences="10" value="óî" /> + <ngram occurrences="10" value="ïþå" /> + <ngram occurrences="10" value="ïé" /> + <ngram occurrences="10" value="ïå" /> + <ngram occurrences="10" value="ï_ù" /> + <ngram occurrences="10" value="ï_î" /> + <ngram occurrences="10" value="ï_á" /> + <ngram occurrences="10" value="îø_" /> + <ngram occurrences="10" value="îô" /> + <ngram occurrences="10" value="îî" /> + <ngram occurrences="10" value="ìøî" /> + <ngram occurrences="10" value="ê_ó" /> + <ngram occurrences="10" value="ê_ð" /> + <ngram occurrences="10" value="é_ð" /> + <ngram occurrences="10" value="åîø_" /> + <ngram occurrences="10" value="åîø" /> + <ngram occurrences="10" value="åí_" /> + <ngram occurrences="10" value="åçï_" /> + <ngram occurrences="10" value="äî" /> + <ngram occurrences="10" value="äá_" /> + <ngram occurrences="10" value="áí_" /> + <ngram occurrences="10" value="_ö" /> + <ngram occurrences="10" value="_îï" /> + <ngram occurrences="9" value="þåîø_" /> + <ngram occurrences="9" value="þåîø" /> + <ngram occurrences="9" value="ýå" /> + <ngram occurrences="9" value="üôï" /> + <ngram occurrences="9" value="ûé" /> + <ngram occurrences="9" value="ùô" /> + <ngram occurrences="9" value="ôó" /> + <ngram occurrences="9" value="ôïò" /> + <ngram occurrences="9" value="ôåò" /> + <ngram occurrences="9" value="ôáô" /> + <ngram occurrences="9" value="óëé" /> + <ngram occurrences="9" value="òáú" /> + <ngram occurrences="9" value="ðòé" /> + <ngram occurrences="9" value="ðòå" /> + <ngram occurrences="9" value="ðïì" /> + <ngram occurrences="9" value="ðï_" /> + <ngram occurrences="9" value="ïþåîø" /> + <ngram occurrences="9" value="ïþåî" /> + <ngram occurrences="9" value="ïöå" /> + <ngram occurrences="9" value="ïìå" /> + <ngram occurrences="9" value="ïçé" /> + <ngram occurrences="9" value="ï_ô" /> + <ngram occurrences="9" value="ï_ðò" /> + <ngram occurrences="9" value="ï_ï" /> + <ngram occurrences="9" value="îïçï_" /> + <ngram occurrences="9" value="îïçï" /> + <ngram occurrences="9" value="îéå" /> + <ngram occurrences="9" value="íïó" /> + <ngram occurrences="9" value="ìá_" /> + <ngram occurrences="9" value="ëá_" /> + <ngram occurrences="9" value="åòå" /> + <ngram occurrences="9" value="å_ô" /> + <ngram occurrences="9" value="áôå" /> + <ngram occurrences="9" value="áæ" /> + <ngram occurrences="9" value="á_ì" /> + <ngram occurrences="9" value="_üôï" /> + <ngram occurrences="9" value="_óï" /> + <ngram occurrences="9" value="_óì" /> + <ngram occurrences="9" value="_ó_" /> + <ngram occurrences="9" value="_ðòé" /> + <ngram occurrences="9" value="_ðòå" /> + <ngram occurrences="9" value="_ïþåî" /> + <ngram occurrences="9" value="_ïþå" /> + <ngram occurrences="9" value="_ïþ" /> + <ngram occurrences="9" value="_âù" /> + <ngram occurrences="9" value="_âï" /> + <ngram occurrences="8" value="ýé" /> + <ngram occurrences="8" value="úá_" /> + <ngram occurrences="8" value="ùí_" /> + <ngram occurrences="8" value="ùí" /> + <ngram occurrences="8" value="ùê_" /> + <ngram occurrences="8" value="ùê" /> + <ngram occurrences="8" value="ø_ó" /> + <ngram occurrences="8" value="ø_ï" /> + <ngram occurrences="8" value="öé" /> + <ngram occurrences="8" value="öåî" /> + <ngram occurrences="8" value="öå_" /> + <ngram occurrences="8" value="õô" /> + <ngram occurrences="8" value="õà" /> + <ngram occurrences="8" value="ôõ" /> + <ngram occurrences="8" value="ôóñ_" /> + <ngram occurrences="8" value="ôóñ" /> + <ngram occurrences="8" value="ôñ" /> + <ngram occurrences="8" value="ôïì" /> + <ngram occurrences="8" value="ôåì" /> + <ngram occurrences="8" value="ôáì" /> + <ngram occurrences="8" value="ôá_" /> + <ngram occurrences="8" value="óôå" /> + <ngram occurrences="8" value="óá" /> + <ngram occurrences="8" value="ò_" /> + <ngram occurrences="8" value="ðá_" /> + <ngram occurrences="8" value="ïòï" /> + <ngram occurrences="8" value="ïæ" /> + <ngram occurrences="8" value="ï_ò" /> + <ngram occurrences="8" value="îñ" /> + <ngram occurrences="8" value="îã" /> + <ngram occurrences="8" value="îáñ_" /> + <ngram occurrences="8" value="îáñ" /> + <ngram occurrences="8" value="î_" /> + <ngram occurrences="8" value="íïö" /> + <ngram occurrences="8" value="íî" /> + <ngram occurrences="8" value="í_ð" /> + <ngram occurrences="8" value="ìåô" /> + <ngram occurrences="8" value="ëò" /> + <ngram occurrences="8" value="éñ" /> + <ngram occurrences="8" value="éê_" /> + <ngram occurrences="8" value="éê" /> + <ngram occurrences="8" value="éâ" /> + <ngram occurrences="8" value="é_ï" /> + <ngram occurrences="8" value="çò" /> + <ngram occurrences="8" value="çáî" /> + <ngram occurrences="8" value="æçáî" /> + <ngram occurrences="8" value="æçá" /> + <ngram occurrences="8" value="æç" /> + <ngram occurrences="8" value="åå_" /> + <ngram occurrences="8" value="å_î" /> + <ngram occurrences="8" value="ãå" /> + <ngram occurrences="8" value="âïì" /> + <ngram occurrences="8" value="âå" /> + <ngram occurrences="8" value="áôø_" /> + <ngram occurrences="8" value="áôø" /> + <ngram occurrences="8" value="áóô" /> + <ngram occurrences="8" value="áîå" /> + <ngram occurrences="8" value="áìøî" /> + <ngram occurrences="8" value="áæçáî" /> + <ngram occurrences="8" value="áæçá" /> + <ngram occurrences="8" value="áæç" /> + <ngram occurrences="8" value="á_é" /> + <ngram occurrences="8" value="_óë" /> + <ngram occurrences="8" value="_ïô" /> + <ngram occurrences="8" value="_ïä" /> + <ngram occurrences="8" value="_ìå" /> + <ngram occurrences="8" value="_çò" /> + <ngram occurrences="8" value="_åó" /> + <ngram occurrences="8" value="_äå" /> + <ngram occurrences="8" value="_áì" /> + <ngram occurrences="8" value="_áæçá" /> + <ngram occurrences="8" value="_áæç" /> + <ngram occurrences="8" value="_áæ" /> + <ngram occurrences="7" value="þáó" /> + <ngram occurrences="7" value="üôï_" /> + <ngram occurrences="7" value="úõ" /> + <ngram occurrences="7" value="úî" /> + <ngram occurrences="7" value="ù_á" /> + <ngram occurrences="7" value="õò" /> + <ngram occurrences="7" value="õë" /> + <ngram occurrences="7" value="ôù" /> + <ngram occurrences="7" value="ôï_ð" /> +</ngrams> diff --git a/src/plugins/language/russian1.klp b/src/plugins/language/russian1.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="770" value="_" /> + <ngram occurrences="414" value="î" /> + <ngram occurrences="317" value="à" /> + <ngram occurrences="315" value="å" /> + <ngram occurrences="278" value="è" /> + <ngram occurrences="260" value="í" /> + <ngram occurrences="239" value="ò" /> + <ngram occurrences="188" value="ë" /> + <ngram occurrences="185" value="ñ" /> + <ngram occurrences="181" value="â" /> + <ngram occurrences="174" value="ð" /> + <ngram occurrences="135" value="ê" /> + <ngram occurrences="130" value="ä" /> + <ngram occurrences="126" value="ó" /> + <ngram occurrences="118" value="ì" /> + <ngram occurrences="108" value="ï" /> + <ngram occurrences="91" value="î_" /> + <ngram occurrences="83" value="è_" /> + <ngram occurrences="83" value="å_" /> + <ngram occurrences="83" value="à_" /> + <ngram occurrences="79" value="_í" /> + <ngram occurrences="78" value="ü" /> + <ngram occurrences="77" value="_ï" /> + <ngram occurrences="74" value="á" /> + <ngram occurrences="73" value="ÿ" /> + <ngram occurrences="72" value="û" /> + <ngram occurrences="65" value="_â" /> + <ngram occurrences="64" value="ç" /> + <ngram occurrences="60" value="ã" /> + <ngram occurrences="59" value="ü_" /> + <ngram occurrences="59" value="_ñ" /> + <ngram occurrences="58" value="_ò" /> + <ngram occurrences="57" value="_è" /> + <ngram occurrences="54" value="òî" /> + <ngram occurrences="52" value="ñò" /> + <ngram occurrences="46" value="íî" /> + <ngram occurrences="45" value="é" /> + <ngram occurrences="43" value="íà" /> + <ngram occurrences="43" value="_î" /> + <ngram occurrences="42" value="ÿ_" /> + <ngram occurrences="42" value="_ê" /> + <ngram occurrences="41" value="ïî" /> + <ngram occurrences="41" value="îâ" /> + <ngram occurrences="41" value="íå" /> + <ngram occurrences="40" value="ó_" /> + <ngram occurrences="40" value="ë_" /> + <ngram occurrences="40" value="é_" /> + <ngram occurrences="40" value="_ïî" /> + <ngram occurrences="40" value="_ì" /> + <ngram occurrences="40" value="_ä" /> + <ngram occurrences="39" value="ø" /> + <ngram occurrences="38" value="îñ" /> + <ngram occurrences="37" value="åí" /> + <ngram occurrences="37" value="àë" /> + <ngram occurrences="37" value="_è_" /> + <ngram occurrences="36" value="ðà" /> + <ngram occurrences="35" value="õ" /> + <ngram occurrences="35" value="íè" /> + <ngram occurrences="35" value="æ" /> + <ngram occurrences="35" value="_á" /> + <ngram occurrences="34" value="ðî" /> + <ngram occurrences="34" value="êî" /> + <ngram occurrences="33" value="òà" /> + <ngram occurrences="33" value="ì_" /> + <ngram occurrences="33" value="êà" /> + <ngram occurrences="31" value="åð" /> + <ngram occurrences="31" value="äå" /> + <ngram occurrences="31" value="âà" /> + <ngram occurrences="31" value="â_" /> + <ngram occurrences="30" value="ëè" /> + <ngram occurrences="29" value="òî_" /> + <ngram occurrences="29" value="ïð" /> + <ngram occurrences="29" value="åë" /> + <ngram occurrences="29" value="äà" /> + <ngram occurrences="29" value="âî" /> + <ngram occurrences="27" value="îð" /> + <ngram occurrences="27" value="ëî" /> + <ngram occurrences="27" value="ãî" /> + <ngram occurrences="27" value="_íà" /> + <ngram occurrences="26" value="òü" /> + <ngram occurrences="26" value="ò_" /> + <ngram occurrences="26" value="ðè" /> + <ngram occurrences="26" value="àí" /> + <ngram occurrences="26" value="_íå" /> + <ngram occurrences="26" value="_å" /> + <ngram occurrences="25" value="òü_" /> + <ngram occurrences="25" value="òå" /> + <ngram occurrences="25" value="îò" /> + <ngram occurrences="25" value="íó" /> + <ngram occurrences="25" value="ëà" /> + <ngram occurrences="25" value="àê" /> + <ngram occurrences="24" value="û_" /> + <ngram occurrences="24" value="îë" /> + <ngram occurrences="24" value="èë" /> + <ngram occurrences="23" value="îí" /> + <ngram occurrences="23" value="_òî" /> + <ngram occurrences="22" value="îä" /> + <ngram occurrences="22" value="íà_" /> + <ngram occurrences="22" value="ê_" /> + <ngram occurrences="22" value="âå" /> + <ngram occurrences="22" value="àâ" /> + <ngram occurrences="22" value="_ç" /> + <ngram occurrences="22" value="_â_" /> + <ngram occurrences="21" value="íå_" /> + <ngram occurrences="21" value="èò" /> + <ngram occurrences="21" value="åò" /> + <ngram occurrences="21" value="_ïð" /> + <ngram occurrences="20" value="ñå" /> + <ngram occurrences="20" value="åì" /> + <ngram occurrences="20" value="_ó" /> + <ngram occurrences="19" value="þ" /> + <ngram occurrences="19" value="íû" /> + <ngram occurrences="19" value="ìî" /> + <ngram occurrences="19" value="àð" /> + <ngram occurrences="19" value="_òî_" /> + <ngram occurrences="18" value="ñÿ" /> + <ngram occurrences="18" value="îã" /> + <ngram occurrences="18" value="îá" /> + <ngram occurrences="18" value="çà" /> + <ngram occurrences="18" value="æå" /> + <ngram occurrences="18" value="_ð" /> + <ngram occurrences="17" value="ö" /> + <ngram occurrences="17" value="_ã" /> + <ngram occurrences="16" value="ñÿ_" /> + <ngram occurrences="16" value="ðå" /> + <ngram occurrences="16" value="îì" /> + <ngram occurrences="16" value="èí" /> + <ngram occurrences="16" value="èê" /> + <ngram occurrences="16" value="åñ" /> + <ngram occurrences="16" value="âè" /> + <ngram occurrences="16" value="_à" /> + <ngram occurrences="15" value="õ_" /> + <ngram occurrences="15" value="îé" /> + <ngram occurrences="15" value="ìå" /> + <ngram occurrences="15" value="âñ" /> + <ngram occurrences="15" value="áî" /> + <ngram occurrences="15" value="_íà_" /> + <ngram occurrences="15" value="_êî" /> + <ngram occurrences="14" value="óë" /> + <ngram occurrences="14" value="ïå" /> + <ngram occurrences="14" value="îé_" /> + <ngram occurrences="14" value="îå" /> + <ngram occurrences="14" value="ëü" /> + <ngram occurrences="14" value="èç" /> + <ngram occurrences="14" value="åä" /> + <ngram occurrences="14" value="äî" /> + <ngram occurrences="14" value="àò" /> + <ngram occurrences="14" value="_æ" /> + <ngram occurrences="13" value="òð" /> + <ngram occurrences="13" value="ñòà" /> + <ngram occurrences="13" value="ñî" /> + <ngram occurrences="13" value="ñ_" /> + <ngram occurrences="13" value="îñò" /> + <ngram occurrences="13" value="íó_" /> + <ngram occurrences="13" value="ìè" /> + <ngram occurrences="13" value="ëå" /> + <ngram occurrences="13" value="êè" /> + <ngram occurrences="13" value="è_ñ" /> + <ngram occurrences="13" value="äà_" /> + <ngram occurrences="13" value="àë_" /> + <ngram occurrences="13" value="àê_" /> + <ngram occurrences="13" value="_òà" /> + <ngram occurrences="13" value="_íå_" /> + <ngram occurrences="13" value="_çà" /> + <ngram occurrences="12" value="þ_" /> + <ngram occurrences="12" value="ñü_" /> + <ngram occurrences="12" value="ñü" /> + <ngram occurrences="12" value="ñà" /> + <ngram occurrences="12" value="î_í" /> + <ngram occurrences="12" value="íî_" /> + <ngram occurrences="12" value="êó" /> + <ngram occurrences="12" value="èå" /> + <ngram occurrences="12" value="åò_" /> + <ngram occurrences="12" value="åì_" /> + <ngram occurrences="12" value="äè" /> + <ngram occurrences="12" value="äåë" /> + <ngram occurrences="12" value="àñ" /> + <ngram occurrences="12" value="_ñò" /> + <ngram occurrences="12" value="_îñ" /> + <ngram occurrences="12" value="_êà" /> + <ngram occurrences="12" value="_äî" /> + <ngram occurrences="12" value="_âñ" /> + <ngram occurrences="11" value="óò" /> + <ngram occurrences="11" value="òâ" /> + <ngram occurrences="11" value="ïðî" /> + <ngram occurrences="11" value="ìó" /> + <ngram occurrences="11" value="ëè_" /> + <ngram occurrences="11" value="êà_" /> + <ngram occurrences="11" value="èòü" /> + <ngram occurrences="11" value="ãî_" /> + <ngram occurrences="11" value="âñå" /> + <ngram occurrences="11" value="áû" /> + <ngram occurrences="11" value="_ñî" /> + <ngram occurrences="11" value="_âî" /> + <ngram occurrences="11" value="_áû" /> + <ngram occurrences="10" value="ûë" /> + <ngram occurrences="10" value="ûé" /> + <ngram occurrences="10" value="óä" /> + <ngram occurrences="10" value="òè" /> + <ngram occurrences="10" value="òàê" /> + <ngram occurrences="10" value="îì_" /> + <ngram occurrences="10" value="îãî" /> + <ngram occurrences="10" value="î_â" /> + <ngram occurrences="10" value="íí" /> + <ngram occurrences="10" value="èòü_" /> + <ngram occurrences="10" value="èñ" /> + <ngram occurrences="10" value="èë_" /> + <ngram occurrences="10" value="è_ï" /> + <ngram occurrences="10" value="çí" /> + <ngram occurrences="10" value="åã" /> + <ngram occurrences="10" value="áó" /> + <ngram occurrences="10" value="àÿ" /> + <ngram occurrences="10" value="_ÿ" /> + <ngram occurrences="10" value="_òå" /> + <ngram occurrences="10" value="_òàê" /> + <ngram occurrences="10" value="_îò" /> + <ngram occurrences="10" value="_íó_" /> + <ngram occurrences="10" value="_íó" /> + <ngram occurrences="10" value="_ë" /> + <ngram occurrences="10" value="_ãî" /> + <ngram occurrences="9" value="ûé_" /> + <ngram occurrences="9" value="ù" /> + <ngram occurrences="9" value="øè" /> + <ngram occurrences="9" value="øå" /> + <ngram occurrences="9" value="óð" /> + <ngram occurrences="9" value="òû" /> + <ngram occurrences="9" value="òó" /> + <ngram occurrences="9" value="ñòî" /> + <ngram occurrences="9" value="ñê" /> + <ngram occurrences="9" value="ðó" /> + <ngram occurrences="9" value="ðà_" /> + <ngram occurrences="9" value="ïë" /> + <ngram occurrences="9" value="î_ï" /> + <ngram occurrences="9" value="ìà" /> + <ngram occurrences="9" value="ëñÿ_" /> + <ngram occurrences="9" value="ëñÿ" /> + <ngram occurrences="9" value="ëñ" /> + <ngram occurrences="9" value="èé" /> + <ngram occurrences="9" value="èå_" /> + <ngram occurrences="9" value="èâ" /> + <ngram occurrences="9" value="æå_" /> + <ngram occurrences="9" value="åñò" /> + <ngram occurrences="9" value="åíè" /> + <ngram occurrences="9" value="å_â" /> + <ngram occurrences="9" value="äí" /> + <ngram occurrences="9" value="âû" /> + <ngram occurrences="9" value="áûë" /> + <ngram occurrences="9" value="àÿ_" /> + <ngram occurrences="9" value="àø" /> + <ngram occurrences="9" value="àç" /> + <ngram occurrences="9" value="à_í" /> + <ngram occurrences="9" value="à_è" /> + <ngram occurrences="9" value="_íî" /> + <ngram occurrences="9" value="_ìî" /> + <ngram occurrences="9" value="_è_ñ" /> + <ngram occurrences="9" value="_æå" /> + <ngram occurrences="9" value="_äà" /> + <ngram occurrences="9" value="_âñå" /> + <ngram occurrences="9" value="_áûë" /> + <ngram occurrences="9" value="_áó" /> + <ngram occurrences="8" value="ÿ_í" /> + <ngram occurrences="8" value="õî" /> + <ngram occurrences="8" value="ó_í" /> + <ngram occurrences="8" value="òû_" /> + <ngram occurrences="8" value="òñ" /> + <ngram occurrences="8" value="òåë" /> + <ngram occurrences="8" value="ñòð" /> + <ngram occurrences="8" value="ñï" /> + <ngram occurrences="8" value="ðü" /> + <ngram occurrences="8" value="ðû" /> + <ngram occurrences="8" value="ïðè" /> + <ngram occurrences="8" value="ïî_" /> + <ngram occurrences="8" value="ïåð" /> + <ngram occurrences="8" value="îæ" /> + <ngram occurrences="8" value="îå_" /> + <ngram occurrences="8" value="îâî" /> + <ngram occurrences="8" value="î_ì" /> + <ngram occurrences="8" value="íü" /> + <ngram occurrences="8" value="íò" /> + <ngram occurrences="8" value="ëîñ" /> + <ngram occurrences="8" value="ëà_" /> + <ngram occurrences="8" value="êàê" /> + <ngram occurrences="8" value="èì" /> + <ngram occurrences="8" value="èä" /> + <ngram occurrences="8" value="è_è" /> + <ngram occurrences="8" value="è_ä" /> + <ngram occurrences="8" value="åé" /> + <ngram occurrences="8" value="åç" /> + <ngram occurrences="8" value="å_î" /> + <ngram occurrences="8" value="å_í" /> + <ngram occurrences="8" value="âîð" /> + <ngram occurrences="8" value="àíè" /> + <ngram occurrences="8" value="àì" /> + <ngram occurrences="8" value="_ðà" /> + <ngram occurrences="8" value="_ïðî" /> + <ngram occurrences="8" value="_ïî_" /> + <ngram occurrences="8" value="_ìè" /> + <ngram occurrences="8" value="_êàê" /> + <ngram occurrences="8" value="_äå" /> + <ngram occurrences="7" value="ü_ñ" /> + <ngram occurrences="7" value="ûå_" /> + <ngram occurrences="7" value="ûå" /> + <ngram occurrences="7" value="öè" /> + <ngram occurrences="7" value="óá" /> + <ngram occurrences="7" value="ó_è" /> + <ngram occurrences="7" value="òîð" /> + <ngram occurrences="7" value="òíî" /> + <ngram occurrences="7" value="òí" /> + <ngram occurrences="7" value="ïðà" /> + <ngram occurrences="7" value="ïîë" /> + <ngram occurrences="7" value="îâîð" /> + <ngram occurrences="7" value="îâà" /> + <ngram occurrences="7" value="îâ_" /> + <ngram occurrences="7" value="î_ò" /> + <ngram occurrences="7" value="î_ñ" /> + <ngram occurrences="7" value="î_íå" /> + <ngram occurrences="7" value="íûé_" /> + <ngram occurrences="7" value="íûé" /> + <ngram occurrences="7" value="íóë" /> + <ngram occurrences="7" value="íîé_" /> + <ngram occurrences="7" value="íîé" /> + <ngram occurrences="7" value="íîâ" /> + <ngram occurrences="7" value="í_" /> + <ngram occurrences="7" value="ìó_" /> + <ngram occurrences="7" value="ìí" /> + <ngram occurrences="7" value="ëî_" /> + <ngram occurrences="7" value="ë_ò" /> + <ngram occurrences="7" value="êò" /> + <ngram occurrences="7" value="êàê_" /> + <ngram occurrences="7" value="èé_" /> + <ngram occurrences="7" value="èè_" /> + <ngram occurrences="7" value="èè" /> + <ngram occurrences="7" value="è_è_" /> + <ngram occurrences="7" value="è_â" /> + <ngram occurrences="7" value="æè" /> + <ngram occurrences="7" value="æåí" /> + <ngram occurrences="7" value="åðå" /> + <ngram occurrences="7" value="åíí" /> + <ngram occurrences="7" value="åë_" /> + <ngram occurrences="7" value="åé_" /> + <ngram occurrences="7" value="å_ò" /> + <ngram occurrences="7" value="å_ä" /> + <ngram occurrences="7" value="ãîâîð" /> + <ngram occurrences="7" value="ãîâî" /> + <ngram occurrences="7" value="ãîâ" /> + <ngram occurrences="7" value="âàë" /> + <ngram occurrences="7" value="áð" /> + <ngram occurrences="7" value="àä" /> + <ngram occurrences="7" value="àâà" /> + <ngram occurrences="7" value="à_î" /> + <ngram occurrences="7" value="à_è_" /> + <ngram occurrences="7" value="à_ä" /> + <ngram occurrences="7" value="_ÿ_" /> + <ngram occurrences="7" value="_ñòà" /> + <ngram occurrences="7" value="_ïðè" /> + <ngram occurrences="7" value="_ïîë" /> + <ngram occurrences="7" value="_íè" /> + <ngram occurrences="7" value="_ìí" /> + <ngram occurrences="7" value="_êàê_" /> + <ngram occurrences="7" value="_âû" /> + <ngram occurrences="6" value="ÿ_ï" /> + <ngram occurrences="6" value="ýòî" /> + <ngram occurrences="6" value="ýò" /> + <ngram occurrences="6" value="ý" /> + <ngram occurrences="6" value="ü_î" /> + <ngram occurrences="6" value="ü_í" /> + <ngram occurrences="6" value="ü_â" /> + <ngram occurrences="6" value="ü_á" /> + <ngram occurrences="6" value="û_í" /> + <ngram occurrences="6" value="øê" /> + <ngram occurrences="6" value="óæ" /> + <ngram occurrences="6" value="ñòâ" /> + <ngram occurrences="6" value="ñîâ" /> + <ngram occurrences="6" value="ñè" /> + <ngram occurrences="6" value="ñåì" /> + <ngram occurrences="6" value="ðü_" /> + <ngram occurrences="6" value="ðîä" /> + <ngram occurrences="6" value="ðèò" /> + <ngram occurrences="6" value="îø" /> + <ngram occurrences="6" value="îòî" /> + <ngram occurrences="6" value="îñü_" /> + <ngram occurrences="6" value="îñü" /> + <ngram occurrences="6" value="îðî" /> + <ngram occurrences="6" value="îï" /> + <ngram occurrences="6" value="îäí" /> + <ngram occurrences="6" value="îäè" /> + <ngram occurrences="6" value="îãî_" /> + <ngram occurrences="6" value="î_ïî" /> + <ngram occurrences="6" value="íÿ" /> + <ngram occurrences="6" value="íûå_" /> + <ngram occurrences="6" value="íûå" /> + <ngram occurrences="6" value="íîã" /> + <ngram occurrences="6" value="ííû" /> + <ngram occurrences="6" value="ìíå_" /> + <ngram occurrences="6" value="ìíå" /> + <ngram occurrences="6" value="ì_ï" /> + <ngram occurrences="6" value="ëÿ" /> + <ngram occurrences="6" value="ëîñü_" /> + <ngram occurrences="6" value="ëîñü" /> + <ngram occurrences="6" value="ë_òî_" /> +</ngrams> diff --git a/src/plugins/language/russian2.klp b/src/plugins/language/russian2.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="760" value="_" /> + <ngram occurrences="379" value="þ" /> + <ngram occurrences="360" value="õ" /> + <ngram occurrences="272" value="ø" /> + <ngram occurrences="264" value="â" /> + <ngram occurrences="242" value="ý" /> + <ngram occurrences="237" value="ð" /> + <ngram occurrences="183" value="ò" /> + <ngram occurrences="172" value="à" /> + <ngram occurrences="170" value="á" /> + <ngram occurrences="142" value="û" /> + <ngram occurrences="120" value="ü" /> + <ngram occurrences="120" value="ã" /> + <ngram occurrences="117" value="ú" /> + <ngram occurrences="99" value="ô" /> + <ngram occurrences="99" value="ß" /> + <ngram occurrences="96" value="ø_" /> + <ngram occurrences="95" value="ï" /> + <ngram occurrences="93" value="õ_" /> + <ngram occurrences="83" value="þ_" /> + <ngram occurrences="82" value="ë" /> + <ngram occurrences="71" value="_ò" /> + <ngram occurrences="68" value="ï_" /> + <ngram occurrences="62" value="ó" /> + <ngram occurrences="61" value="ð_" /> + <ngram occurrences="61" value="_ý" /> + <ngram occurrences="60" value="_ß" /> + <ngram occurrences="59" value="ì" /> + <ngram occurrences="55" value="ç" /> + <ngram occurrences="54" value="_ø" /> + <ngram occurrences="53" value="áâ" /> + <ngram occurrences="52" value="_á" /> + <ngram occurrences="51" value="þò" /> + <ngram occurrences="51" value="ñ" /> + <ngram occurrences="51" value="âþ" /> + <ngram occurrences="49" value="_â" /> + <ngram occurrences="48" value="ù" /> + <ngram occurrences="47" value="ýþ" /> + <ngram occurrences="47" value="ýõ" /> + <ngram occurrences="47" value="õý" /> + <ngram occurrences="46" value="ù_" /> + <ngram occurrences="44" value="_þ" /> + <ngram occurrences="40" value="_ø_" /> + <ngram occurrences="39" value="óþ" /> + <ngram occurrences="38" value="ë_" /> + <ngram occurrences="37" value="õà" /> + <ngram occurrences="37" value="_ü" /> + <ngram occurrences="37" value="_ô" /> + <ngram occurrences="35" value="ö" /> + <ngram occurrences="34" value="ýø" /> + <ngram occurrences="34" value="àþ" /> + <ngram occurrences="34" value="_ú" /> + <ngram occurrences="33" value="ã_" /> + <ngram occurrences="33" value="âð" /> + <ngram occurrences="32" value="ò_" /> + <ngram occurrences="32" value="ì_" /> + <ngram occurrences="32" value="è" /> + <ngram occurrences="31" value="ýð" /> + <ngram occurrences="31" value="âõ" /> + <ngram occurrences="30" value="ü_" /> + <ngram occurrences="28" value="òð" /> + <ngram occurrences="28" value="å" /> + <ngram occurrences="28" value="â_" /> + <ngram occurrences="28" value="àõ" /> + <ngram occurrences="27" value="þà" /> + <ngram occurrences="27" value="úþ" /> + <ngram occurrences="27" value="òõ" /> + <ngram occurrences="27" value="ðý" /> + <ngram occurrences="27" value="_ýõ" /> + <ngram occurrences="26" value="þû" /> + <ngram occurrences="26" value="þâ" /> + <ngram occurrences="26" value="ûø" /> + <ngram occurrences="26" value="úð" /> + <ngram occurrences="26" value="õâ" /> + <ngram occurrences="26" value="àð" /> + <ngram occurrences="25" value="ýõ_" /> + <ngram occurrences="25" value="üõ" /> + <ngram occurrences="25" value="ûþ" /> + <ngram occurrences="25" value="âø" /> + <ngram occurrences="25" value="àø" /> + <ngram occurrences="25" value="ßþ" /> + <ngram occurrences="24" value="ú_" /> + <ngram occurrences="24" value="õá" /> + <ngram occurrences="24" value="ßà" /> + <ngram occurrences="24" value="_ã" /> + <ngram occurrences="23" value="þý" /> + <ngram occurrences="23" value="ûì" /> + <ngram occurrences="23" value="óþ_" /> + <ngram occurrences="23" value="_ñ" /> + <ngram occurrences="22" value="þù" /> + <ngram occurrences="22" value="øâ" /> + <ngram occurrences="22" value="æ" /> + <ngram occurrences="21" value="þù_" /> + <ngram occurrences="21" value="òþ" /> + <ngram occurrences="21" value="òë" /> + <ngram occurrences="21" value="ðú" /> + <ngram occurrences="21" value="çõ" /> + <ngram occurrences="21" value="âã" /> + <ngram occurrences="20" value="þô" /> + <ngram occurrences="20" value="õü" /> + <ngram occurrences="20" value="òá" /> + <ngram occurrences="20" value="_ï" /> + <ngram occurrences="20" value="_à" /> + <ngram occurrences="20" value="_ßþ" /> + <ngram occurrences="19" value="ûõ" /> + <ngram occurrences="19" value="ôõ" /> + <ngram occurrences="19" value="ðû" /> + <ngram occurrences="19" value="âþ_" /> + <ngram occurrences="19" value="_ßà" /> + <ngram occurrences="18" value="ðâ" /> + <ngram occurrences="18" value="_ýð" /> + <ngram occurrences="18" value="_òë" /> + <ngram occurrences="18" value="_ð" /> + <ngram occurrences="18" value="_ç" /> + <ngram occurrences="17" value="þü" /> + <ngram occurrences="17" value="þó" /> + <ngram occurrences="17" value="üþ" /> + <ngram occurrences="17" value="öõ" /> + <ngram occurrences="17" value="ôþ" /> + <ngram occurrences="17" value="áõ" /> + <ngram occurrences="17" value="_ýõ_" /> + <ngram occurrences="17" value="_ó" /> + <ngram occurrences="17" value="_òá" /> + <ngram occurrences="17" value="_ï_" /> + <ngram occurrences="16" value="þá" /> + <ngram occurrences="16" value="øý" /> + <ngram occurrences="16" value="õû" /> + <ngram occurrences="16" value="õô" /> + <ngram occurrences="16" value="õó" /> + <ngram occurrences="16" value="ôð" /> + <ngram occurrences="16" value="î" /> + <ngram occurrences="16" value="âì" /> + <ngram occurrences="16" value="áï" /> + <ngram occurrences="15" value="¸" /> + <ngram occurrences="15" value="üø" /> + <ngram occurrences="15" value="ûø_" /> + <ngram occurrences="15" value="û_" /> + <ngram occurrences="15" value="øï" /> + <ngram occurrences="15" value="ðú_" /> + <ngram occurrences="15" value="âë" /> + <ngram occurrences="15" value="âà" /> + <ngram occurrences="15" value="áû" /> + <ngram occurrences="15" value="àã" /> + <ngram occurrences="15" value="_¸" /> + <ngram occurrences="15" value="_õ" /> + <ngram occurrences="15" value="_ò_" /> + <ngram occurrences="14" value="þò_" /> + <ngram occurrences="14" value="øü" /> + <ngram occurrences="14" value="øò" /> + <ngram occurrences="14" value="øï_" /> + <ngram occurrences="14" value="õóþ" /> + <ngram occurrences="14" value="òáõ" /> + <ngram occurrences="14" value="ßõ" /> + <ngram occurrences="14" value="_úð" /> + <ngram occurrences="14" value="_òáõ" /> + <ngram occurrences="14" value="_áâ" /> + <ngram occurrences="13" value="þòð" /> + <ngram occurrences="13" value="ýþ_" /> + <ngram occurrences="13" value="ýë" /> + <ngram occurrences="13" value="ýã" /> + <ngram occurrences="13" value="úø" /> + <ngram occurrences="13" value="õ_ß" /> + <ngram occurrences="13" value="é" /> + <ngram occurrences="13" value="å_" /> + <ngram occurrences="13" value="ãâ" /> + <ngram occurrences="13" value="áï_" /> + <ngram occurrences="13" value="_úþ" /> + <ngram occurrences="13" value="__" /> + <ngram occurrences="12" value="þóþ" /> + <ngram occurrences="12" value="ýý" /> + <ngram occurrences="12" value="ýð_" /> + <ngram occurrences="12" value="ø_á" /> + <ngram occurrences="12" value="õóþ_" /> + <ngram occurrences="12" value="õâ_" /> + <ngram occurrences="12" value="ðò" /> + <ngram occurrences="12" value="âì_" /> + <ngram occurrences="12" value="âë_" /> + <ngram occurrences="12" value="áþ" /> + <ngram occurrences="12" value="áõ_" /> + <ngram occurrences="12" value="áâð" /> + <ngram occurrences="12" value="___" /> + <ngram occurrences="11" value="þñ" /> + <ngram occurrences="11" value="þàø" /> + <ngram occurrences="11" value="ýøï_" /> + <ngram occurrences="11" value="ýøï" /> + <ngram occurrences="11" value="ûìý" /> + <ngram occurrences="11" value="úðú" /> + <ngram occurrences="11" value="øà" /> + <ngram occurrences="11" value="ø_ò" /> + <ngram occurrences="11" value="õ_ò" /> + <ngram occurrences="11" value="òáõ_" /> + <ngram occurrences="11" value="ìý" /> + <ngram occurrences="11" value="çø" /> + <ngram occurrences="11" value="çâ" /> + <ngram occurrences="11" value="âò" /> + <ngram occurrences="11" value="áâà" /> + <ngram occurrences="11" value="àþò" /> + <ngram occurrences="11" value="ßø" /> + <ngram occurrences="11" value="ßàþ" /> + <ngram occurrences="11" value="_üþ" /> + <ngram occurrences="11" value="_òáõ_" /> + <ngram occurrences="11" value="_âõ" /> + <ngram occurrences="11" value="____" /> + <ngram occurrences="10" value="½" /> + <ngram occurrences="10" value="þûì" /> + <ngram occurrences="10" value="þóþ_" /> + <ngram occurrences="10" value="þ_ý" /> + <ngram occurrences="10" value="ýæ" /> + <ngram occurrences="10" value="ûð" /> + <ngram occurrences="10" value="ûìýþ" /> + <ngram occurrences="10" value="úðú_" /> + <ngram occurrences="10" value="øû" /> + <ngram occurrences="10" value="øú" /> + <ngram occurrences="10" value="øù_" /> + <ngram occurrences="10" value="øù" /> + <ngram occurrences="10" value="øá" /> + <ngram occurrences="10" value="õýø" /> + <ngram occurrences="10" value="õü_" /> + <ngram occurrences="10" value="õú" /> + <ngram occurrences="10" value="òû" /> + <ngram occurrences="10" value="î_" /> + <ngram occurrences="10" value="í" /> + <ngram occurrences="10" value="ìýþ" /> + <ngram occurrences="10" value="çâþ" /> + <ngram occurrences="10" value="æõ" /> + <ngram occurrences="10" value="âõà" /> + <ngram occurrences="10" value="áú" /> + <ngram occurrences="10" value="àõô" /> + <ngram occurrences="10" value="_½" /> + <ngram occurrences="10" value="_úðú_" /> + <ngram occurrences="10" value="_úðú" /> + <ngram occurrences="10" value="_ôþ" /> + <ngram occurrences="10" value="_í" /> + <ngram occurrences="10" value="_çâþ" /> + <ngram occurrences="10" value="_çâ" /> + <ngram occurrences="10" value="_âþ" /> + <ngram occurrences="10" value="_áþ" /> + <ngram occurrences="10" value="_____" /> + <ngram occurrences="9" value="þûþ" /> + <ngram occurrences="9" value="þòþ" /> + <ngram occurrences="9" value="þòðý" /> + <ngram occurrences="9" value="þ_þ" /> + <ngram occurrences="9" value="ý_" /> + <ngram occurrences="9" value="üð" /> + <ngram occurrences="9" value="ûõý" /> + <ngram occurrences="9" value="úâ" /> + <ngram occurrences="9" value="øç" /> + <ngram occurrences="9" value="ø_ý" /> + <ngram occurrences="9" value="õç" /> + <ngram occurrences="9" value="õáâ" /> + <ngram occurrences="9" value="ô_" /> + <ngram occurrences="9" value="òðý" /> + <ngram occurrences="9" value="ñõ" /> + <ngram occurrences="9" value="ñë" /> + <ngram occurrences="9" value="èø" /> + <ngram occurrences="9" value="èõ" /> + <ngram occurrences="9" value="ãû" /> + <ngram occurrences="9" value="ãà" /> + <ngram occurrences="9" value="àð_" /> + <ngram occurrences="9" value="ßõà" /> + <ngram occurrences="9" value="_þâ" /> + <ngram occurrences="9" value="_üõ" /> + <ngram occurrences="9" value="_û" /> + <ngram occurrences="9" value="_ö" /> + <ngram occurrences="9" value="_óþ" /> + <ngram occurrences="9" value="_âð" /> + <ngram occurrences="8" value="þö" /> + <ngram occurrences="8" value="üý" /> + <ngram occurrences="8" value="ûï" /> + <ngram occurrences="8" value="úþý" /> + <ngram occurrences="8" value="ù_ß" /> + <ngram occurrences="8" value="øõ" /> + <ngram occurrences="8" value="øçõ" /> + <ngram occurrences="8" value="õàõ" /> + <ngram occurrences="8" value="õ_â" /> + <ngram occurrences="8" value="ôã" /> + <ngram occurrences="8" value="ðï_" /> + <ngram occurrences="8" value="ðï" /> + <ngram occurrences="8" value="ð_ý" /> + <ngram occurrences="8" value="ð_ò" /> + <ngram occurrences="8" value="ï_ò" /> + <ngram occurrences="8" value="çâþ_" /> + <ngram occurrences="8" value="æø" /> + <ngram occurrences="8" value="ä" /> + <ngram occurrences="8" value="âø_" /> + <ngram occurrences="8" value="âõ_" /> + <ngram occurrences="8" value="âðú" /> + <ngram occurrences="8" value="àë" /> + <ngram occurrences="8" value="_ýø" /> + <ngram occurrences="8" value="_úþý" /> + <ngram occurrences="8" value="_òõ" /> + <ngram occurrences="8" value="_çâþ_" /> + <ngram occurrences="8" value="_ã_" /> + <ngram occurrences="8" value="_âë_" /> + <ngram occurrences="8" value="_âë" /> + <ngram occurrences="8" value="_àð" /> + <ngram occurrences="8" value="_ßàþ" /> + <ngram occurrences="7" value="þü_" /> + <ngram occurrences="7" value="þõ" /> + <ngram occurrences="7" value="þè" /> + <ngram occurrences="7" value="þâþ" /> + <ngram occurrences="7" value="þ_ò" /> + <ngram occurrences="7" value="þ_â" /> + <ngram occurrences="7" value="þ_ß" /> + <ngram occurrences="7" value="ýþù_" /> + <ngram occurrences="7" value="ýþù" /> + <ngram occurrences="7" value="ýýþ" /> + <ngram occurrences="7" value="ýï" /> + <ngram occurrences="7" value="üõý" /> + <ngram occurrences="7" value="ûþò" /> + <ngram occurrences="7" value="úø_" /> + <ngram occurrences="7" value="øå" /> + <ngram occurrences="7" value="ø_â" /> + <ngram occurrences="7" value="õò" /> + <ngram occurrences="7" value="õß" /> + <ngram occurrences="7" value="õ_ã" /> + <ngram occurrences="7" value="óþò" /> + <ngram occurrences="7" value="òð_" /> + <ngram occurrences="7" value="òë_" /> + <ngram occurrences="7" value="ðýø" /> + <ngram occurrences="7" value="ðûìýþ" /> + <ngram occurrences="7" value="ðûìý" /> + <ngram occurrences="7" value="ðûì" /> + <ngram occurrences="7" value="ðè" /> + <ngram occurrences="7" value="ï_ß" /> + <ngram occurrences="7" value="åþ" /> + <ngram occurrences="7" value="ãü" /> + <ngram occurrences="7" value="áâø" /> + <ngram occurrences="7" value="á_" /> + <ngram occurrences="7" value="àþòð" /> + <ngram occurrences="7" value="²" /> + <ngram occurrences="7" value="_ôõ" /> + <ngram occurrences="7" value="_ôð" /> + <ngram occurrences="7" value="_ñõ" /> + <ngram occurrences="7" value="_âðú" /> + <ngram occurrences="7" value="_âã" /> + <ngram occurrences="7" value="_àõ" /> + <ngram occurrences="7" value="_ßõà" /> + <ngram occurrences="7" value="_ßõ" /> + <ngram occurrences="7" value="_²" /> + <ngram occurrences="6" value="¸_" /> + <ngram occurrences="6" value="þýæõß" /> + <ngram occurrences="6" value="þýæõ" /> + <ngram occurrences="6" value="þýæ" /> + <ngram occurrences="6" value="þöõ" /> + <ngram occurrences="6" value="þõ_" /> + <ngram occurrences="6" value="þáâ" /> + <ngram occurrences="6" value="þ_ü" /> + <ngram occurrences="6" value="þ_ø" /> + <ngram occurrences="6" value="ýþò" /> + <ngram occurrences="6" value="ýæõßâ" /> + <ngram occurrences="6" value="ýæõß" /> + <ngram occurrences="6" value="ýæõ" /> + <ngram occurrences="6" value="ýâ" /> + <ngram occurrences="6" value="üë" /> + <ngram occurrences="6" value="üã_" /> + <ngram occurrences="6" value="üã" /> + <ngram occurrences="6" value="ü_â" /> + <ngram occurrences="6" value="ûìýþ_" /> + <ngram occurrences="6" value="úþýæõ" /> + <ngram occurrences="6" value="úþýæ" /> + <ngram occurrences="6" value="øø_" /> + <ngram occurrences="6" value="øø" /> + <ngram occurrences="6" value="øå_" /> + <ngram occurrences="6" value="øâõ" /> + <ngram occurrences="6" value="øàþòð" /> + <ngram occurrences="6" value="øàþò" /> + <ngram occurrences="6" value="øàþ" /> + <ngram occurrences="6" value="ø_ü" /> + <ngram occurrences="6" value="ø_ø" /> + <ngram occurrences="6" value="ø_ß" /> + <ngram occurrences="6" value="öø" /> + <ngram occurrences="6" value="öõ_" /> + <ngram occurrences="6" value="õýý" /> + <ngram occurrences="6" value="õýøï_" /> + <ngram occurrences="6" value="õýøï" /> + <ngram occurrences="6" value="õýõ" /> + <ngram occurrences="6" value="õýâ" /> + <ngram occurrences="6" value="õù_" /> + <ngram occurrences="6" value="õù" /> + <ngram occurrences="6" value="õè" /> + <ngram occurrences="6" value="õßâãð" /> + <ngram occurrences="6" value="õßâã" /> + <ngram occurrences="6" value="õßâ" /> + <ngram occurrences="6" value="õ_þ" /> + <ngram occurrences="6" value="õ_òë" /> + <ngram occurrences="6" value="õ_ßþ" /> + <ngram occurrences="6" value="òþà" /> + <ngram occurrences="6" value="òþ_" /> + <ngram occurrences="6" value="òý" /> + <ngram occurrences="6" value="òûõ" /> + <ngram occurrences="6" value="òø" /> + <ngram occurrences="6" value="ðü" /> + <ngram occurrences="6" value="ðõ" /> + <ngram occurrences="6" value="ðñ" /> + <ngram occurrences="6" value="ðâì" /> + <ngram occurrences="6" value="ðá" /> + <ngram occurrences="6" value="ïâ" /> + <ngram occurrences="6" value="ï_á" /> + <ngram occurrences="6" value="ìýþ_" /> +</ngrams> diff --git a/src/plugins/language/sanskrit.klp b/src/plugins/language/sanskrit.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1209" value="a" /> + <ngram occurrences="477" value="_" /> + <ngram occurrences="350" value="h" /> + <ngram occurrences="283" value="i" /> + <ngram occurrences="232" value="n" /> + <ngram occurrences="222" value="t" /> + <ngram occurrences="192" value="m" /> + <ngram occurrences="189" value="r" /> + <ngram occurrences="186" value="aa" /> + <ngram occurrences="185" value="s" /> + <ngram occurrences="177" value="a_" /> + <ngram occurrences="154" value="ha" /> + <ngram occurrences="136" value="d" /> + <ngram occurrences="134" value="am" /> + <ngram occurrences="130" value="v" /> + <ngram occurrences="123" value="y" /> + <ngram occurrences="122" value="na" /> + <ngram occurrences="120" value="an" /> + <ngram occurrences="108" value="e" /> + <ngram occurrences="100" value="ya" /> + <ngram occurrences="98" value="u" /> + <ngram occurrences="96" value="ar" /> + <ngram occurrences="95" value="ta" /> + <ngram occurrences="92" value="va" /> + <ngram occurrences="90" value="p" /> + <ngram occurrences="87" value="ra" /> + <ngram occurrences="79" value="ma" /> + <ngram occurrences="78" value="at" /> + <ngram occurrences="76" value="k" /> + <ngram occurrences="74" value="sh" /> + <ngram occurrences="70" value="_n" /> + <ngram occurrences="67" value="m_" /> + <ngram occurrences="66" value="ana" /> + <ngram occurrences="64" value="ah" /> + <ngram occurrences="61" value="i_" /> + <ngram occurrences="61" value="as" /> + <ngram occurrences="60" value="am_" /> + <ngram occurrences="59" value="o" /> + <ngram occurrences="59" value="g" /> + <ngram occurrences="55" value="h_" /> + <ngram occurrences="54" value="ad" /> + <ngram occurrences="52" value="b" /> + <ngram occurrences="51" value="_s" /> + <ngram occurrences="49" value="pa" /> + <ngram occurrences="49" value="c" /> + <ngram occurrences="48" value="da" /> + <ngram occurrences="47" value="aan" /> + <ngram occurrences="45" value="e_" /> + <ngram occurrences="44" value="j" /> + <ngram occurrences="44" value="ama" /> + <ngram occurrences="43" value="hi" /> + <ngram occurrences="43" value="ch" /> + <ngram occurrences="40" value="it" /> + <ngram occurrences="40" value="ara" /> + <ngram occurrences="39" value="sa" /> + <ngram occurrences="39" value="na_" /> + <ngram occurrences="39" value="dh" /> + <ngram occurrences="38" value="ay" /> + <ngram occurrences="37" value="av" /> + <ngram occurrences="37" value="aa_" /> + <ngram occurrences="35" value="a_n" /> + <ngram occurrences="35" value="_na" /> + <ngram occurrences="34" value="ka" /> + <ngram occurrences="33" value="sha" /> + <ngram occurrences="33" value="l" /> + <ngram occurrences="33" value="ja" /> + <ngram occurrences="32" value="_p" /> + <ngram occurrences="32" value="_h" /> + <ngram occurrences="31" value="is" /> + <ngram occurrences="31" value="ii" /> + <ngram occurrences="31" value="bh" /> + <ngram occurrences="29" value="ti" /> + <ngram occurrences="29" value="ap" /> + <ngram occurrences="29" value="ah_" /> + <ngram occurrences="28" value="ni" /> + <ngram occurrences="28" value="ga" /> + <ngram occurrences="27" value="nam" /> + <ngram occurrences="27" value="ha_" /> + <ngram occurrences="27" value="aya" /> + <ngram occurrences="27" value="_g" /> + <ngram occurrences="27" value="_b" /> + <ngram occurrences="26" value="ata" /> + <ngram occurrences="26" value="ai" /> + <ngram occurrences="25" value="aha" /> + <ngram occurrences="25" value="aana" /> + <ngram occurrences="25" value="_v" /> + <ngram occurrences="25" value="_t" /> + <ngram occurrences="25" value="_a" /> + <ngram occurrences="24" value="la" /> + <ngram occurrences="24" value="_j" /> + <ngram occurrences="23" value="vi" /> + <ngram occurrences="23" value="di" /> + <ngram occurrences="23" value="ava" /> + <ngram occurrences="23" value="_d" /> + <ngram occurrences="22" value="st" /> + <ngram occurrences="22" value="ri" /> + <ngram occurrences="22" value="ish" /> + <ngram occurrences="22" value="al" /> + <ngram occurrences="22" value="ak" /> + <ngram occurrences="22" value="_sa" /> + <ngram occurrences="22" value="_k" /> + <ngram occurrences="21" value="yaa" /> + <ngram occurrences="21" value="vaa" /> + <ngram occurrences="21" value="ham" /> + <ngram occurrences="21" value="haa" /> + <ngram occurrences="21" value="_h_" /> + <ngram occurrences="20" value="o_" /> + <ngram occurrences="20" value="ag" /> + <ngram occurrences="20" value="_m" /> + <ngram occurrences="19" value="th" /> + <ngram occurrences="19" value="ita" /> + <ngram occurrences="19" value="hh" /> + <ngram occurrences="19" value="es" /> + <ngram occurrences="19" value="_ja" /> + <ngram occurrences="19" value="_ch" /> + <ngram occurrences="19" value="_c" /> + <ngram occurrences="18" value="ya_" /> + <ngram occurrences="18" value="taa" /> + <ngram occurrences="18" value="esh" /> + <ngram occurrences="18" value="ala" /> + <ngram occurrences="17" value="tha" /> + <ngram occurrences="17" value="ram" /> + <ngram occurrences="17" value="maa" /> + <ngram occurrences="17" value="in" /> + <ngram occurrences="17" value="dha" /> + <ngram occurrences="17" value="chi" /> + <ngram occurrences="17" value="cha" /> + <ngram occurrences="17" value="bha" /> + <ngram occurrences="17" value="_na_" /> + <ngram occurrences="16" value="x" /> + <ngram occurrences="16" value="tva" /> + <ngram occurrences="16" value="tv" /> + <ngram occurrences="16" value="pr" /> + <ngram occurrences="16" value="nd" /> + <ngram occurrences="16" value="naa" /> + <ngram occurrences="16" value="me" /> + <ngram occurrences="16" value="id" /> + <ngram occurrences="16" value="har" /> + <ngram occurrences="16" value="ana_" /> + <ngram occurrences="16" value="adh" /> + <ngram occurrences="16" value="_y" /> + <ngram occurrences="16" value="_pa" /> + <ngram occurrences="15" value="shh" /> + <ngram occurrences="15" value="ik" /> + <ngram occurrences="15" value="ada" /> + <ngram occurrences="14" value="yat" /> + <ngram occurrences="14" value="vam" /> + <ngram occurrences="14" value="te" /> + <ngram occurrences="14" value="tas" /> + <ngram occurrences="14" value="sya" /> + <ngram occurrences="14" value="sy" /> + <ngram occurrences="14" value="pra" /> + <ngram occurrences="14" value="paa" /> + <ngram occurrences="14" value="n_" /> + <ngram occurrences="14" value="ham_" /> + <ngram occurrences="14" value="ati" /> + <ngram occurrences="14" value="ash" /> + <ngram occurrences="14" value="ani" /> + <ngram occurrences="14" value="aka" /> + <ngram occurrences="14" value="a_j" /> + <ngram occurrences="14" value="_ya" /> + <ngram occurrences="14" value="_nam" /> + <ngram occurrences="14" value="_i" /> + <ngram occurrences="13" value="yam" /> + <ngram occurrences="13" value="uu" /> + <ngram occurrences="13" value="ta_" /> + <ngram occurrences="13" value="su" /> + <ngram occurrences="13" value="sta" /> + <ngram occurrences="13" value="ru" /> + <ngram occurrences="13" value="ra_" /> + <ngram occurrences="13" value="ir" /> + <ngram occurrences="13" value="hya" /> + <ngram occurrences="13" value="hy" /> + <ngram occurrences="13" value="hav" /> + <ngram occurrences="13" value="esha" /> + <ngram occurrences="13" value="asya" /> + <ngram occurrences="13" value="asy" /> + <ngram occurrences="13" value="anaa" /> + <ngram occurrences="13" value="aam" /> + <ngram occurrences="13" value="aad" /> + <ngram occurrences="13" value="_ma" /> + <ngram occurrences="13" value="_bh" /> + <ngram occurrences="12" value="va_" /> + <ngram occurrences="12" value="re" /> + <ngram occurrences="12" value="r_i" /> + <ngram occurrences="12" value="r_" /> + <ngram occurrences="12" value="par" /> + <ngram occurrences="12" value="nda" /> + <ngram occurrences="12" value="nama" /> + <ngram occurrences="12" value="m_h" /> + <ngram occurrences="12" value="eva" /> + <ngram occurrences="12" value="ev" /> + <ngram occurrences="12" value="daa" /> + <ngram occurrences="12" value="ast" /> + <ngram occurrences="12" value="anam" /> + <ngram occurrences="12" value="aj" /> + <ngram occurrences="12" value="aga" /> + <ngram occurrences="12" value="ab" /> + <ngram occurrences="12" value="aah" /> + <ngram occurrences="12" value="a_m" /> + <ngram occurrences="12" value="a_ja" /> + <ngram occurrences="12" value="a_ch" /> + <ngram occurrences="12" value="a_c" /> + <ngram occurrences="12" value="a_b" /> + <ngram occurrences="12" value="_sh" /> + <ngram occurrences="12" value="_ga" /> + <ngram occurrences="11" value="ye" /> + <ngram occurrences="11" value="var" /> + <ngram occurrences="11" value="ur" /> + <ngram occurrences="11" value="tr" /> + <ngram occurrences="11" value="sar" /> + <ngram occurrences="11" value="rt" /> + <ngram occurrences="11" value="om" /> + <ngram occurrences="11" value="mi" /> + <ngram occurrences="11" value="m_h_" /> + <ngram occurrences="11" value="iv" /> + <ngram occurrences="11" value="han" /> + <ngram occurrences="11" value="ax" /> + <ngram occurrences="11" value="asta" /> + <ngram occurrences="11" value="ari" /> + <ngram occurrences="11" value="am_h_" /> + <ngram occurrences="11" value="am_h" /> + <ngram occurrences="11" value="aham" /> + <ngram occurrences="11" value="adi" /> + <ngram occurrences="11" value="aay" /> + <ngram occurrences="11" value="a_v" /> + <ngram occurrences="11" value="a_s" /> + <ngram occurrences="11" value="a_k" /> + <ngram occurrences="11" value="_vi" /> + <ngram occurrences="11" value="_pr" /> + <ngram occurrences="11" value="_nama" /> + <ngram occurrences="11" value="_cha" /> + <ngram occurrences="11" value="_bha" /> + <ngram occurrences="10" value="tra" /> + <ngram occurrences="10" value="nt" /> + <ngram occurrences="10" value="man" /> + <ngram occurrences="10" value="m_n" /> + <ngram occurrences="10" value="kh" /> + <ngram occurrences="10" value="kaa" /> + <ngram occurrences="10" value="jaa" /> + <ngram occurrences="10" value="ishh" /> + <ngram occurrences="10" value="ii_" /> + <ngram occurrences="10" value="i_t" /> + <ngram occurrences="10" value="hava" /> + <ngram occurrences="10" value="ed" /> + <ngram occurrences="10" value="aya_" /> + <ngram occurrences="10" value="apa" /> + <ngram occurrences="10" value="ami" /> + <ngram occurrences="10" value="aat" /> + <ngram occurrences="10" value="aas" /> + <ngram occurrences="10" value="a_g" /> + <ngram occurrences="10" value="a_d" /> + <ngram occurrences="10" value="_ta" /> + <ngram occurrences="10" value="_it" /> + <ngram occurrences="9" value="yo" /> + <ngram occurrences="9" value="yai" /> + <ngram occurrences="9" value="vaan" /> + <ngram occurrences="9" value="ut" /> + <ngram occurrences="9" value="un" /> + <ngram occurrences="9" value="u_" /> + <ngram occurrences="9" value="ti_" /> + <ngram occurrences="9" value="te_" /> + <ngram occurrences="9" value="taa_" /> + <ngram occurrences="9" value="ni_" /> + <ngram occurrences="9" value="nam_" /> + <ngram occurrences="9" value="mah" /> + <ngram occurrences="9" value="ke" /> + <ngram occurrences="9" value="jaan" /> + <ngram occurrences="9" value="i_s" /> + <ngram occurrences="9" value="hu" /> + <ngram occurrences="9" value="hr" /> + <ngram occurrences="9" value="he" /> + <ngram occurrences="9" value="hara" /> + <ngram occurrences="9" value="h_s" /> + <ngram occurrences="9" value="gy" /> + <ngram occurrences="9" value="dhi" /> + <ngram occurrences="9" value="avi" /> + <ngram occurrences="9" value="atha" /> + <ngram occurrences="9" value="ath" /> + <ngram occurrences="9" value="ame" /> + <ngram occurrences="9" value="am_n" /> + <ngram occurrences="9" value="ai_" /> + <ngram occurrences="9" value="aani" /> + <ngram occurrences="9" value="_va" /> + <ngram occurrences="9" value="_pra" /> + <ngram occurrences="9" value="_ka" /> + <ngram occurrences="8" value="ye_" /> + <ngram occurrences="8" value="yaan" /> + <ngram occurrences="8" value="ve" /> + <ngram occurrences="8" value="vam_" /> + <ngram occurrences="8" value="us" /> + <ngram occurrences="8" value="up" /> + <ngram occurrences="8" value="um" /> + <ngram occurrences="8" value="tvam" /> + <ngram occurrences="8" value="tat" /> + <ngram occurrences="8" value="tasya" /> + <ngram occurrences="8" value="tasy" /> + <ngram occurrences="8" value="tam" /> + <ngram occurrences="8" value="syai" /> + <ngram occurrences="8" value="rva" /> + <ngram occurrences="8" value="rv" /> + <ngram occurrences="8" value="ran" /> + <ngram occurrences="8" value="rama" /> + <ngram occurrences="8" value="raa" /> + <ngram occurrences="8" value="r_it" /> + <ngram occurrences="8" value="pu" /> + <ngram occurrences="8" value="na_n" /> + <ngram occurrences="8" value="mas" /> + <ngram occurrences="8" value="mar" /> + <ngram occurrences="8" value="ma_" /> + <ngram occurrences="8" value="ina" /> + <ngram occurrences="8" value="i_n" /> + <ngram occurrences="8" value="hit" /> + <ngram occurrences="8" value="hha" /> + <ngram occurrences="8" value="hch" /> + <ngram occurrences="8" value="hc" /> + <ngram occurrences="8" value="hat" /> + <ngram occurrences="8" value="h_p" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="e_p" /> + <ngram occurrences="8" value="bhav" /> + <ngram occurrences="8" value="asyai" /> + <ngram occurrences="8" value="asha" /> + <ngram occurrences="8" value="asa" /> + <ngram occurrences="8" value="art" /> + <ngram occurrences="8" value="are" /> + <ngram occurrences="8" value="ani_" /> + <ngram occurrences="8" value="anam_" /> + <ngram occurrences="8" value="amas" /> + <ngram occurrences="8" value="aar" /> + <ngram occurrences="8" value="aana_" /> + <ngram occurrences="8" value="a_p" /> + <ngram occurrences="8" value="a_ma" /> + <ngram occurrences="8" value="a_bh" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_r" /> + <ngram occurrences="8" value="_par" /> + <ngram occurrences="8" value="_jaa" /> + <ngram occurrences="8" value="_dh" /> + <ngram occurrences="8" value="_da" /> + <ngram occurrences="8" value="_aham" /> + <ngram occurrences="8" value="_aha" /> + <ngram occurrences="8" value="_ah" /> + <ngram occurrences="7" value="yam_" /> + <ngram occurrences="7" value="yai_" /> + <ngram occurrences="7" value="yaana" /> + <ngram occurrences="7" value="xa" /> + <ngram occurrences="7" value="vat" /> + <ngram occurrences="7" value="tu" /> + <ngram occurrences="7" value="tan" /> + <ngram occurrences="7" value="stasy" /> + <ngram occurrences="7" value="stas" /> + <ngram occurrences="7" value="shi" /> + <ngram occurrences="7" value="saa" /> + <ngram occurrences="7" value="re_" /> + <ngram occurrences="7" value="rat" /> + <ngram occurrences="7" value="ram_" /> + <ngram occurrences="7" value="rah" /> + <ngram occurrences="7" value="pi" /> + <ngram occurrences="7" value="ny" /> + <ngram occurrences="7" value="nu" /> + <ngram occurrences="7" value="nas" /> + <ngram occurrences="7" value="jaana" /> + <ngram occurrences="7" value="ip" /> + <ngram occurrences="7" value="ika" /> + <ngram occurrences="7" value="iit" /> + <ngram occurrences="7" value="ih" /> + <ngram occurrences="7" value="ida" /> + <ngram occurrences="7" value="i_na" /> + <ngram occurrences="7" value="hva" /> + <ngram occurrences="7" value="hv" /> + <ngram occurrences="7" value="ho" /> + <ngram occurrences="7" value="hana" /> + <ngram occurrences="7" value="ha_n" /> + <ngram occurrences="7" value="gya" /> + <ngram occurrences="7" value="de" /> + <ngram occurrences="7" value="dar" /> + <ngram occurrences="7" value="cha_" /> + <ngram occurrences="7" value="bhava" /> + <ngram occurrences="7" value="ba" /> + <ngram occurrences="7" value="ate_" /> + <ngram occurrences="7" value="ate" /> + <ngram occurrences="7" value="astas" /> + <ngram occurrences="7" value="arva" /> + <ngram occurrences="7" value="arv" /> + <ngram occurrences="7" value="aru" /> + <ngram occurrences="7" value="aran" /> + <ngram occurrences="7" value="aram" /> + <ngram occurrences="7" value="api" /> + <ngram occurrences="7" value="amah" /> + <ngram occurrences="7" value="amaa" /> + <ngram occurrences="7" value="aja" /> + <ngram occurrences="7" value="ah_s" /> + <ngram occurrences="7" value="adhi" /> + <ngram occurrences="7" value="aaya" /> + <ngram occurrences="7" value="aanaa" /> + <ngram occurrences="7" value="aadh" /> + <ngram occurrences="7" value="a_nd" /> + <ngram occurrences="7" value="a_na" /> + <ngram occurrences="7" value="a_n_" /> +</ngrams> diff --git a/src/plugins/language/scots.klp b/src/plugins/language/scots.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="4021" value="_" /> + <ngram occurrences="2142" value="e" /> + <ngram occurrences="1716" value="a" /> + <ngram occurrences="1534" value="t" /> + <ngram occurrences="1229" value="i" /> + <ngram occurrences="1176" value="n" /> + <ngram occurrences="928" value="o" /> + <ngram occurrences="912" value="r" /> + <ngram occurrences="901" value="h" /> + <ngram occurrences="838" value="s" /> + <ngram occurrences="707" value="_a" /> + <ngram occurrences="639" value="e_" /> + <ngram occurrences="626" value="n_" /> + <ngram occurrences="621" value="_t" /> + <ngram occurrences="592" value="l" /> + <ngram occurrences="548" value="d" /> + <ngram occurrences="509" value="t_" /> + <ngram occurrences="475" value="th" /> + <ngram occurrences="447" value="w" /> + <ngram occurrences="413" value="he" /> + <ngram occurrences="409" value="_th" /> + <ngram occurrences="405" value="s_" /> + <ngram occurrences="377" value="an" /> + <ngram occurrences="356" value="u" /> + <ngram occurrences="356" value="a_" /> + <ngram occurrences="335" value="c" /> + <ngram occurrences="333" value="b" /> + <ngram occurrences="308" value="the" /> + <ngram occurrences="284" value="m" /> + <ngram occurrences="284" value="_the" /> + <ngram occurrences="282" value="_w" /> + <ngram occurrences="282" value="_s" /> + <ngram occurrences="279" value="g" /> + <ngram occurrences="279" value="ee" /> + <ngram occurrences="275" value="d_" /> + <ngram occurrences="274" value="in" /> + <ngram occurrences="273" value="r_" /> + <ngram occurrences="272" value="_a_" /> + <ngram occurrences="270" value="er" /> + <ngram occurrences="261" value="_b" /> + <ngram occurrences="258" value="f" /> + <ngram occurrences="255" value="an_" /> + <ngram occurrences="253" value="y" /> + <ngram occurrences="250" value="k" /> + <ngram occurrences="248" value="_o" /> + <ngram occurrences="242" value="the_" /> + <ngram occurrences="242" value="he_" /> + <ngram occurrences="241" value="_the_" /> + <ngram occurrences="236" value="_an" /> + <ngram occurrences="223" value="_an_" /> + <ngram occurrences="202" value="i_" /> + <ngram occurrences="179" value="en" /> + <ngram occurrences="172" value="p" /> + <ngram occurrences="171" value="wa" /> + <ngram occurrences="166" value="in_" /> + <ngram occurrences="162" value="_f" /> + <ngram occurrences="157" value="re" /> + <ngram occurrences="156" value="_m" /> + <ngram occurrences="152" value="ei" /> + <ngram occurrences="149" value="it" /> + <ngram occurrences="148" value="te" /> + <ngram occurrences="146" value="et" /> + <ngram occurrences="145" value="as" /> + <ngram occurrences="144" value="_h" /> + <ngram occurrences="143" value="_wa" /> + <ngram occurrences="141" value="_d" /> + <ngram occurrences="139" value="oo" /> + <ngram occurrences="139" value="_i" /> + <ngram occurrences="138" value="ti" /> + <ngram occurrences="136" value="le" /> + <ngram occurrences="136" value="er_" /> + <ngram occurrences="135" value="ui" /> + <ngram occurrences="131" value="ai" /> + <ngram occurrences="130" value="o_" /> + <ngram occurrences="129" value="ha" /> + <ngram occurrences="126" value="at" /> + <ngram occurrences="124" value="on" /> + <ngram occurrences="122" value="_g" /> + <ngram occurrences="121" value="or" /> + <ngram occurrences="120" value="y_" /> + <ngram occurrences="120" value="_c" /> + <ngram occurrences="118" value="n_t" /> + <ngram occurrences="118" value="n_a" /> + <ngram occurrences="115" value="_l" /> + <ngram occurrences="111" value="h_" /> + <ngram occurrences="110" value="s_a" /> + <ngram occurrences="110" value="as_" /> + <ngram occurrences="109" value="ch" /> + <ngram occurrences="107" value="t_a" /> + <ngram occurrences="104" value="st" /> + <ngram occurrences="103" value="_ti" /> + <ngram occurrences="99" value="e_a" /> + <ngram occurrences="99" value="_o_" /> + <ngram occurrences="98" value="en_" /> + <ngram occurrences="97" value="ti_" /> + <ngram occurrences="95" value="ow" /> + <ngram occurrences="95" value="ke" /> + <ngram occurrences="90" value="t_t" /> + <ngram occurrences="90" value="_ti_" /> + <ngram occurrences="90" value="_r" /> + <ngram occurrences="89" value="es" /> + <ngram occurrences="89" value="ed" /> + <ngram occurrences="89" value="at_" /> + <ngram occurrences="88" value="ae" /> + <ngram occurrences="87" value="_n" /> + <ngram occurrences="86" value="ra" /> + <ngram occurrences="85" value="et_" /> + <ngram occurrences="84" value="ie" /> + <ngram occurrences="83" value="nd" /> + <ngram occurrences="82" value="on_" /> + <ngram occurrences="82" value="it_" /> + <ngram occurrences="82" value="een" /> + <ngram occurrences="81" value="_e" /> + <ngram occurrences="80" value="n_th" /> + <ngram occurrences="78" value="was" /> + <ngram occurrences="78" value="ma" /> + <ngram occurrences="78" value="fo" /> + <ngram occurrences="78" value="el" /> + <ngram occurrences="78" value="eet" /> + <ngram occurrences="78" value="ar" /> + <ngram occurrences="78" value="_was" /> + <ngram occurrences="77" value="her" /> + <ngram occurrences="76" value="ot" /> + <ngram occurrences="76" value="or_" /> + <ngram occurrences="76" value="nt" /> + <ngram occurrences="76" value="l_" /> + <ngram occurrences="76" value="ir" /> + <ngram occurrences="75" value="eet_" /> + <ngram occurrences="75" value="_fo" /> + <ngram occurrences="74" value="la" /> + <ngram occurrences="73" value="se" /> + <ngram occurrences="73" value="ll" /> + <ngram occurrences="73" value="is" /> + <ngram occurrences="73" value="_ma" /> + <ngram occurrences="71" value="was_" /> + <ngram occurrences="71" value="_y" /> + <ngram occurrences="71" value="_was_" /> + <ngram occurrences="70" value="k_" /> + <ngram occurrences="70" value="ed_" /> + <ngram occurrences="70" value="de" /> + <ngram occurrences="69" value="tha" /> + <ngram occurrences="68" value="ne" /> + <ngram occurrences="67" value="ic" /> + <ngram occurrences="66" value="me" /> + <ngram occurrences="65" value="li" /> + <ngram occurrences="65" value="aa" /> + <ngram occurrences="64" value="ht" /> + <ngram occurrences="63" value="wu" /> + <ngram occurrences="63" value="we" /> + <ngram occurrences="63" value="v" /> + <ngram occurrences="63" value="t_th" /> + <ngram occurrences="63" value="_p" /> + <ngram occurrences="62" value="ro" /> + <ngram occurrences="62" value="hi" /> + <ngram occurrences="62" value="e_b" /> + <ngram occurrences="62" value="_wu" /> + <ngram occurrences="60" value="e_t" /> + <ngram occurrences="60" value="bo" /> + <ngram occurrences="59" value="re_" /> + <ngram occurrences="59" value="een_" /> + <ngram occurrences="59" value="cht" /> + <ngram occurrences="58" value="il" /> + <ngram occurrences="58" value="for" /> + <ngram occurrences="58" value="_he" /> + <ngram occurrences="57" value="es_" /> + <ngram occurrences="56" value="rt" /> + <ngram occurrences="56" value="ri" /> + <ngram occurrences="56" value="n_a_" /> + <ngram occurrences="56" value="i_t" /> + <ngram occurrences="55" value="ter" /> + <ngram occurrences="55" value="_for" /> + <ngram occurrences="54" value="ther" /> + <ngram occurrences="54" value="bi" /> + <ngram occurrences="54" value="_tha" /> + <ngram occurrences="54" value="_st" /> + <ngram occurrences="54" value="_on" /> + <ngram occurrences="53" value="s_an_" /> + <ngram occurrences="53" value="s_an" /> + <ngram occurrences="53" value="r_a" /> + <ngram occurrences="53" value="ng" /> + <ngram occurrences="53" value="n_the" /> + <ngram occurrences="52" value="nd_" /> + <ngram occurrences="52" value="ht_" /> + <ngram occurrences="52" value="a_w" /> + <ngram occurrences="51" value="tt" /> + <ngram occurrences="51" value="ge" /> + <ngram occurrences="51" value="ga" /> + <ngram occurrences="51" value="d_t" /> + <ngram occurrences="51" value="ck" /> + <ngram occurrences="51" value="_bi" /> + <ngram occurrences="51" value="_a_w" /> + <ngram occurrences="50" value="id" /> + <ngram occurrences="50" value="be" /> + <ngram occurrences="49" value="t_the" /> + <ngram occurrences="49" value="n_o" /> + <ngram occurrences="48" value="s_t" /> + <ngram occurrences="48" value="ot_" /> + <ngram occurrences="48" value="ho" /> + <ngram occurrences="48" value="e_w" /> + <ngram occurrences="48" value="ad" /> + <ngram occurrences="48" value="_k" /> + <ngram occurrences="47" value="t_w" /> + <ngram occurrences="47" value="na" /> + <ngram occurrences="47" value="i_th" /> + <ngram occurrences="47" value="hat" /> + <ngram occurrences="47" value="cht_" /> + <ngram occurrences="47" value="br" /> + <ngram occurrences="47" value="_on_" /> + <ngram occurrences="46" value="ye" /> + <ngram occurrences="46" value="t_a_" /> + <ngram occurrences="46" value="n_s" /> + <ngram occurrences="46" value="g_" /> + <ngram occurrences="46" value="al" /> + <ngram occurrences="46" value="_it" /> + <ngram occurrences="46" value="_br" /> + <ngram occurrences="45" value="z" /> + <ngram occurrences="45" value="ui_" /> + <ngram occurrences="45" value="hat_" /> + <ngram occurrences="45" value="eh" /> + <ngram occurrences="44" value="yi" /> + <ngram occurrences="44" value="wh" /> + <ngram occurrences="44" value="pe" /> + <ngram occurrences="44" value="o_t" /> + <ngram occurrences="44" value="le_" /> + <ngram occurrences="44" value="for_" /> + <ngram occurrences="44" value="e_s" /> + <ngram occurrences="44" value="an_t" /> + <ngram occurrences="44" value="ae_" /> + <ngram occurrences="44" value="_wh" /> + <ngram occurrences="44" value="_for_" /> + <ngram occurrences="43" value="j" /> + <ngram occurrences="43" value="ay" /> + <ngram occurrences="43" value="air" /> + <ngram occurrences="43" value="_be" /> + <ngram occurrences="42" value="wui" /> + <ngram occurrences="42" value="ts" /> + <ngram occurrences="42" value="that_" /> + <ngram occurrences="42" value="that" /> + <ngram occurrences="42" value="i_the" /> + <ngram occurrences="42" value="_wui" /> + <ngram occurrences="42" value="_that" /> + <ngram occurrences="41" value="wui_" /> + <ngram occurrences="41" value="un" /> + <ngram occurrences="41" value="tee" /> + <ngram occurrences="41" value="oot" /> + <ngram occurrences="41" value="od" /> + <ngram occurrences="41" value="ie_" /> + <ngram occurrences="41" value="ca" /> + <ngram occurrences="41" value="_wui_" /> + <ngram occurrences="41" value="_le" /> + <ngram occurrences="41" value="_bo" /> + <ngram occurrences="40" value="ts_" /> + <ngram occurrences="40" value="rt_" /> + <ngram occurrences="40" value="r_t" /> + <ngram occurrences="39" value="the_b" /> + <ngram occurrences="39" value="nt_" /> + <ngram occurrences="39" value="no" /> + <ngram occurrences="39" value="m_" /> + <ngram occurrences="39" value="he_b" /> + <ngram occurrences="39" value="ere" /> + <ngram occurrences="39" value="eh_" /> + <ngram occurrences="39" value="an_a" /> + <ngram occurrences="39" value="ad_" /> + <ngram occurrences="39" value="a_wa" /> + <ngram occurrences="38" value="ter_" /> + <ngram occurrences="38" value="t_s" /> + <ngram occurrences="38" value="s_a_" /> + <ngram occurrences="38" value="rr" /> + <ngram occurrences="38" value="e_o" /> + <ngram occurrences="38" value="e_a_" /> + <ngram occurrences="38" value="_yi" /> + <ngram occurrences="38" value="_ga" /> + <ngram occurrences="38" value="_as" /> + <ngram occurrences="38" value="_a_wa" /> + <ngram occurrences="37" value="t_o" /> + <ngram occurrences="37" value="sh" /> + <ngram occurrences="37" value="oa" /> + <ngram occurrences="37" value="ni" /> + <ngram occurrences="37" value="in_a" /> + <ngram occurrences="37" value="d_a" /> + <ngram occurrences="37" value="co" /> + <ngram occurrences="37" value="_in" /> + <ngram occurrences="37" value="_at" /> + <ngram occurrences="37" value="_as_" /> + <ngram occurrences="37" value="_an_t" /> + <ngram occurrences="36" value="ree" /> + <ngram occurrences="36" value="rd" /> + <ngram occurrences="36" value="o_th" /> + <ngram occurrences="36" value="ng_" /> + <ngram occurrences="36" value="ik" /> + <ngram occurrences="36" value="ei_" /> + <ngram occurrences="36" value="e_m" /> + <ngram occurrences="36" value="da" /> + <ngram occurrences="36" value="bit" /> + <ngram occurrences="36" value="au" /> + <ngram occurrences="36" value="_j" /> + <ngram occurrences="36" value="_ca" /> + <ngram occurrences="35" value="w_" /> + <ngram occurrences="35" value="so" /> + <ngram occurrences="35" value="oon" /> + <ngram occurrences="35" value="nn" /> + <ngram occurrences="35" value="n_f" /> + <ngram occurrences="35" value="ll_" /> + <ngram occurrences="35" value="fi" /> + <ngram occurrences="35" value="_ro" /> + <ngram occurrences="35" value="_bit" /> + <ngram occurrences="34" value="tr" /> + <ngram occurrences="34" value="st_" /> + <ngram occurrences="34" value="oot_" /> + <ngram occurrences="34" value="n_b" /> + <ngram occurrences="34" value="ill" /> + <ngram occurrences="34" value="her_" /> + <ngram occurrences="34" value="ea" /> + <ngram occurrences="34" value="e_th" /> + <ngram occurrences="34" value="a_t" /> + <ngram occurrences="34" value="a_s" /> + <ngram occurrences="34" value="_o_t" /> + <ngram occurrences="33" value="ther_" /> + <ngram occurrences="33" value="t_an" /> + <ngram occurrences="33" value="ns" /> + <ngram occurrences="33" value="lo" /> + <ngram occurrences="33" value="ich" /> + <ngram occurrences="33" value="_s_" /> + <ngram occurrences="33" value="_me" /> + <ngram occurrences="32" value="ur" /> + <ngram occurrences="32" value="ki" /> + <ngram occurrences="32" value="as_a" /> + <ngram occurrences="32" value="an_th" /> + <ngram occurrences="32" value="_ther" /> + <ngram occurrences="32" value="_it_" /> + <ngram occurrences="31" value="ve" /> + <ngram occurrences="31" value="um" /> + <ngram occurrences="31" value="thi" /> + <ngram occurrences="31" value="ta" /> + <ngram occurrences="31" value="t_an_" /> + <ngram occurrences="31" value="p_" /> + <ngram occurrences="31" value="n_w" /> + <ngram occurrences="31" value="han" /> + <ngram occurrences="31" value="fe" /> + <ngram occurrences="31" value="ba" /> + <ngram occurrences="31" value="aw" /> + <ngram occurrences="31" value="ang" /> + <ngram occurrences="31" value="a_was" /> + <ngram occurrences="31" value="_se" /> + <ngram occurrences="31" value="_o_th" /> + <ngram occurrences="31" value="_la" /> + <ngram occurrences="31" value="_ha" /> + <ngram occurrences="31" value="_da" /> + <ngram occurrences="31" value="_at_" /> + <ngram occurrences="30" value="to" /> + <ngram occurrences="30" value="icht" /> + <ngram occurrences="30" value="der" /> + <ngram occurrences="30" value="d_th" /> + <ngram occurrences="30" value="ce" /> + <ngram occurrences="30" value="bit_" /> + <ngram occurrences="30" value="_co" /> + <ngram occurrences="29" value="tte" /> + <ngram occurrences="29" value="t_wa" /> + <ngram occurrences="29" value="si" /> + <ngram occurrences="29" value="s_th" /> + <ngram occurrences="29" value="owe" /> + <ngram occurrences="29" value="ir_" /> + <ngram occurrences="29" value="hin" /> + <ngram occurrences="29" value="here" /> + <ngram occurrences="29" value="h_a" /> + <ngram occurrences="29" value="er_a" /> + <ngram occurrences="29" value="eed" /> + <ngram occurrences="29" value="bra" /> + <ngram occurrences="29" value="ay_" /> + <ngram occurrences="29" value="an_a_" /> + <ngram occurrences="29" value="a_d" /> + <ngram occurrences="29" value="_ke" /> + <ngram occurrences="29" value="_bra" /> + <ngram occurrences="29" value="_bit_" /> + <ngram occurrences="29" value="_ba" /> + <ngram occurrences="28" value="wee" /> + <ngram occurrences="28" value="tu" /> + <ngram occurrences="28" value="thr" /> + <ngram occurrences="28" value="s_w" /> + <ngram occurrences="28" value="s_o" /> + <ngram occurrences="28" value="n_an" /> + <ngram occurrences="28" value="ma_" /> + <ngram occurrences="28" value="lei" /> + <ngram occurrences="28" value="ld" /> + <ngram occurrences="28" value="lan" /> + <ngram occurrences="28" value="ke_" /> + <ngram occurrences="28" value="in_t" /> + <ngram occurrences="28" value="im" /> + <ngram occurrences="28" value="hr" /> + <ngram occurrences="28" value="here_" /> + <ngram occurrences="28" value="gi" /> + <ngram occurrences="28" value="eth" /> + <ngram occurrences="28" value="ere_" /> + <ngram occurrences="28" value="eik" /> + <ngram occurrences="28" value="do" /> + <ngram occurrences="28" value="bu" /> + <ngram occurrences="28" value="ab" /> + <ngram occurrences="28" value="a_b" /> + <ngram occurrences="28" value="_ma_" /> + <ngram occurrences="27" value="rn" /> +</ngrams> diff --git a/src/plugins/language/scots_gaelic.klp b/src/plugins/language/scots_gaelic.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="466" value="_" /> + <ngram occurrences="383" value="a" /> + <ngram occurrences="237" value="h" /> + <ngram occurrences="222" value="i" /> + <ngram occurrences="190" value="n" /> + <ngram occurrences="126" value="e" /> + <ngram occurrences="122" value="d" /> + <ngram occurrences="119" value="r" /> + <ngram occurrences="107" value="_a" /> + <ngram occurrences="97" value="g" /> + <ngram occurrences="93" value="c" /> + <ngram occurrences="89" value="n_" /> + <ngram occurrences="87" value="h_" /> + <ngram occurrences="86" value="t" /> + <ngram occurrences="85" value="s" /> + <ngram occurrences="81" value="l" /> + <ngram occurrences="75" value="a_" /> + <ngram occurrences="73" value="an" /> + <ngram occurrences="71" value="u" /> + <ngram occurrences="67" value="ai" /> + <ngram occurrences="64" value="ch" /> + <ngram occurrences="58" value="o" /> + <ngram occurrences="55" value="ea" /> + <ngram occurrences="55" value="dh" /> + <ngram occurrences="54" value="ha" /> + <ngram occurrences="53" value="b" /> + <ngram occurrences="47" value="_c" /> + <ngram occurrences="45" value="_t" /> + <ngram occurrences="44" value="an_" /> + <ngram occurrences="42" value="r_" /> + <ngram occurrences="42" value="m" /> + <ngram occurrences="41" value="id" /> + <ngram occurrences="40" value="na" /> + <ngram occurrences="38" value="th" /> + <ngram occurrences="38" value="ir" /> + <ngram occurrences="36" value="_g" /> + <ngram occurrences="36" value="_b" /> + <ngram occurrences="35" value="à" /> + <ngram occurrences="34" value="s_" /> + <ngram occurrences="33" value="nn" /> + <ngram occurrences="33" value="ac" /> + <ngram occurrences="31" value="idh" /> + <ngram occurrences="31" value="dh_" /> + <ngram occurrences="31" value="ach" /> + <ngram occurrences="30" value="n_a" /> + <ngram occurrences="30" value="ad" /> + <ngram occurrences="29" value="_an" /> + <ngram occurrences="29" value="_a_" /> + <ngram occurrences="28" value="in" /> + <ngram occurrences="28" value="ei" /> + <ngram occurrences="28" value="d_" /> + <ngram occurrences="28" value="bh" /> + <ngram occurrences="28" value="_s" /> + <ngram occurrences="26" value="he" /> + <ngram occurrences="26" value="gh" /> + <ngram occurrences="25" value="nn_" /> + <ngram occurrences="24" value="ig" /> + <ngram occurrences="24" value="h_a" /> + <ngram occurrences="24" value="gu" /> + <ngram occurrences="24" value="_n" /> + <ngram occurrences="24" value="_d" /> + <ngram occurrences="23" value="ir_" /> + <ngram occurrences="23" value="_ch" /> + <ngram occurrences="22" value="il" /> + <ngram occurrences="22" value="_e" /> + <ngram occurrences="22" value="_ai" /> + <ngram occurrences="21" value="ean" /> + <ngram occurrences="21" value="_th" /> + <ngram occurrences="20" value="f" /> + <ngram occurrences="20" value="cha" /> + <ngram occurrences="20" value="ann" /> + <ngram occurrences="19" value="ài" /> + <ngram occurrences="19" value="ha_" /> + <ngram occurrences="19" value="g_" /> + <ngram occurrences="19" value="e_" /> + <ngram occurrences="19" value="ar" /> + <ngram occurrences="19" value="air" /> + <ngram occurrences="19" value="ag" /> + <ngram occurrences="19" value="_na" /> + <ngram occurrences="19" value="_f" /> + <ngram occurrences="18" value="is" /> + <ngram occurrences="18" value="_an_" /> + <ngram occurrences="17" value="ann_" /> + <ngram occurrences="17" value="_r" /> + <ngram occurrences="16" value="ui" /> + <ngram occurrences="16" value="tha" /> + <ngram occurrences="16" value="la" /> + <ngram occurrences="16" value="as" /> + <ngram occurrences="15" value="us_" /> + <ngram occurrences="15" value="us" /> + <ngram occurrences="15" value="oi" /> + <ngram occurrences="15" value="l_" /> + <ngram occurrences="15" value="ig_" /> + <ngram occurrences="15" value="hai" /> + <ngram occurrences="15" value="gus_" /> + <ngram occurrences="15" value="gus" /> + <ngram occurrences="15" value="da" /> + <ngram occurrences="15" value="ch_" /> + <ngram occurrences="15" value="am" /> + <ngram occurrences="15" value="air_" /> + <ngram occurrences="15" value="aid" /> + <ngram occurrences="15" value="adh" /> + <ngram occurrences="15" value="_i" /> + <ngram occurrences="15" value="_bh" /> + <ngram occurrences="14" value="tha_" /> + <ngram occurrences="14" value="ta" /> + <ngram occurrences="14" value="ri" /> + <ngram occurrences="14" value="na_" /> + <ngram occurrences="14" value="m_" /> + <ngram occurrences="14" value="le" /> + <ngram occurrences="14" value="idh_" /> + <ngram occurrences="14" value="gh_" /> + <ngram occurrences="14" value="eac" /> + <ngram occurrences="14" value="an_a" /> + <ngram occurrences="14" value="_na_" /> + <ngram occurrences="13" value="on" /> + <ngram occurrences="13" value="hea" /> + <ngram occurrences="13" value="agus_" /> + <ngram occurrences="13" value="agus" /> + <ngram occurrences="13" value="agu" /> + <ngram occurrences="13" value="_tha_" /> + <ngram occurrences="13" value="_tha" /> + <ngram occurrences="13" value="_agus" /> + <ngram occurrences="13" value="_agu" /> + <ngram occurrences="13" value="_ag" /> + <ngram occurrences="12" value="n_an" /> + <ngram occurrences="12" value="hu" /> + <ngram occurrences="12" value="hl" /> + <ngram occurrences="12" value="hi" /> + <ngram occurrences="12" value="each" /> + <ngram occurrences="12" value="ao" /> + <ngram occurrences="12" value="al" /> + <ngram occurrences="12" value="aidh" /> + <ngram occurrences="12" value="adh_" /> + <ngram occurrences="12" value="ach_" /> + <ngram occurrences="12" value="a_g" /> + <ngram occurrences="12" value="_air" /> + <ngram occurrences="11" value="àidh" /> + <ngram occurrences="11" value="àid" /> + <ngram occurrences="11" value="te" /> + <ngram occurrences="11" value="rd" /> + <ngram occurrences="11" value="r_a" /> + <ngram occurrences="11" value="nn_a" /> + <ngram occurrences="11" value="ma" /> + <ngram occurrences="11" value="hd" /> + <ngram occurrences="11" value="eil" /> + <ngram occurrences="11" value="ean_" /> + <ngram occurrences="11" value="chd" /> + <ngram occurrences="11" value="aig" /> + <ngram occurrences="11" value="_gu" /> + <ngram occurrences="11" value="_ann_" /> + <ngram occurrences="11" value="_ann" /> + <ngram occurrences="11" value="_air_" /> + <ngram occurrences="10" value="u_" /> + <ngram occurrences="10" value="t_" /> + <ngram occurrences="10" value="p" /> + <ngram occurrences="10" value="ne" /> + <ngram occurrences="10" value="n_c" /> + <ngram occurrences="10" value="ith" /> + <ngram occurrences="10" value="it" /> + <ngram occurrences="10" value="inn" /> + <ngram occurrences="10" value="chai" /> + <ngram occurrences="10" value="ar_" /> + <ngram occurrences="10" value="ann_a" /> + <ngram occurrences="10" value="am_" /> + <ngram occurrences="10" value="aidh_" /> + <ngram occurrences="10" value="achd" /> + <ngram occurrences="10" value="a_c" /> + <ngram occurrences="10" value="_l" /> + <ngram occurrences="9" value="ò" /> + <ngram occurrences="9" value="ua" /> + <ngram occurrences="9" value="th_" /> + <ngram occurrences="9" value="se" /> + <ngram occurrences="9" value="sa" /> + <ngram occurrences="9" value="n_an_" /> + <ngram occurrences="9" value="mh" /> + <ngram occurrences="9" value="li" /> + <ngram occurrences="9" value="lea" /> + <ngram occurrences="9" value="is_" /> + <ngram occurrences="9" value="ia" /> + <ngram occurrences="9" value="gàidh" /> + <ngram occurrences="9" value="gàid" /> + <ngram occurrences="9" value="gài" /> + <ngram occurrences="9" value="gà" /> + <ngram occurrences="9" value="ga" /> + <ngram occurrences="9" value="dh_a" /> + <ngram occurrences="9" value="ad_" /> + <ngram occurrences="9" value="acha" /> + <ngram occurrences="9" value="_gàid" /> + <ngram occurrences="9" value="_gài" /> + <ngram occurrences="9" value="_gà" /> + <ngram occurrences="9" value="_ei" /> + <ngram occurrences="8" value="ì" /> + <ngram occurrences="8" value="àr" /> + <ngram occurrences="8" value="sg" /> + <ngram occurrences="8" value="s_a" /> + <ngram occurrences="8" value="re" /> + <ngram occurrences="8" value="ra" /> + <ngram occurrences="8" value="lt" /> + <ngram occurrences="8" value="lig" /> + <ngram occurrences="8" value="io" /> + <ngram occurrences="8" value="ho" /> + <ngram occurrences="8" value="hli" /> + <ngram occurrences="8" value="hei" /> + <ngram occurrences="8" value="haid" /> + <ngram occurrences="8" value="dhl" /> + <ngram occurrences="8" value="dhe" /> + <ngram occurrences="8" value="bhe" /> + <ngram occurrences="8" value="ba" /> + <ngram occurrences="8" value="ain" /> + <ngram occurrences="8" value="a_b" /> + <ngram occurrences="8" value="_ta" /> + <ngram occurrences="8" value="_cha" /> + <ngram occurrences="7" value="ù" /> + <ngram occurrences="7" value="àidhl" /> + <ngram occurrences="7" value="o_" /> + <ngram occurrences="7" value="nn_an" /> + <ngram occurrences="7" value="n_e" /> + <ngram occurrences="7" value="lig_" /> + <ngram occurrences="7" value="in_" /> + <ngram occurrences="7" value="il_" /> + <ngram occurrences="7" value="igh" /> + <ngram occurrences="7" value="idhli" /> + <ngram occurrences="7" value="idhl" /> + <ngram occurrences="7" value="idhe" /> + <ngram occurrences="7" value="hui" /> + <ngram occurrences="7" value="hlig_" /> + <ngram occurrences="7" value="hlig" /> + <ngram occurrences="7" value="hd_" /> + <ngram occurrences="7" value="h_t" /> + <ngram occurrences="7" value="h_b" /> + <ngram occurrences="7" value="fh" /> + <ngram occurrences="7" value="fa" /> + <ngram occurrences="7" value="du" /> + <ngram occurrences="7" value="dhlig" /> + <ngram occurrences="7" value="dhli" /> + <ngram occurrences="7" value="chd_" /> + <ngram occurrences="7" value="chaid" /> + <ngram occurrences="7" value="bh_" /> + <ngram occurrences="7" value="at" /> + <ngram occurrences="7" value="_se" /> + <ngram occurrences="7" value="_gh" /> + <ngram occurrences="7" value="_fa" /> + <ngram occurrences="7" value="_dh" /> + <ngram occurrences="7" value="_aig" /> + <ngram occurrences="6" value="ur" /> + <ngram occurrences="6" value="un" /> + <ngram occurrences="6" value="tr" /> + <ngram occurrences="6" value="s_n" /> + <ngram occurrences="6" value="ri_" /> + <ngram occurrences="6" value="rd_" /> + <ngram occurrences="6" value="ona" /> + <ngram occurrences="6" value="on_" /> + <ngram occurrences="6" value="oin" /> + <ngram occurrences="6" value="nea" /> + <ngram occurrences="6" value="nan" /> + <ngram occurrences="6" value="nam" /> + <ngram occurrences="6" value="n_t" /> + <ngram occurrences="6" value="n_g" /> + <ngram occurrences="6" value="n_ei" /> + <ngram occurrences="6" value="n_a_" /> + <ngram occurrences="6" value="m_b" /> + <ngram occurrences="6" value="l_a" /> + <ngram occurrences="6" value="ir_a" /> + <ngram occurrences="6" value="ilt" /> + <ngram occurrences="6" value="ile" /> + <ngram occurrences="6" value="igh_" /> + <ngram occurrences="6" value="ig_a" /> + <ngram occurrences="6" value="ic" /> + <ngram occurrences="6" value="i_" /> + <ngram occurrences="6" value="hà" /> + <ngram occurrences="6" value="han" /> + <ngram occurrences="6" value="haidh" /> + <ngram occurrences="6" value="h_c" /> + <ngram occurrences="6" value="h_ai" /> + <ngram occurrences="6" value="h_a_" /> + <ngram occurrences="6" value="gu_" /> + <ngram occurrences="6" value="gha" /> + <ngram occurrences="6" value="g_a" /> + <ngram occurrences="6" value="eir" /> + <ngram occurrences="6" value="e_t" /> + <ngram occurrences="6" value="de" /> + <ngram occurrences="6" value="d_a" /> + <ngram occurrences="6" value="ce" /> + <ngram occurrences="6" value="aoi" /> + <ngram occurrences="6" value="ana" /> + <ngram occurrences="6" value="an_c" /> + <ngram occurrences="6" value="am_b" /> + <ngram occurrences="6" value="ain_" /> + <ngram occurrences="6" value="aig_" /> + <ngram occurrences="6" value="agh" /> + <ngram occurrences="6" value="ada" /> + <ngram occurrences="6" value="achd_" /> + <ngram occurrences="6" value="a_t" /> + <ngram occurrences="6" value="a_d" /> + <ngram occurrences="6" value="a_a" /> + <ngram occurrences="6" value="_tr" /> + <ngram occurrences="6" value="_ri" /> + <ngram occurrences="6" value="_p" /> + <ngram occurrences="6" value="_m" /> + <ngram occurrences="6" value="_io" /> + <ngram occurrences="6" value="_h_" /> + <ngram occurrences="6" value="_h" /> + <ngram occurrences="6" value="_gu_" /> + <ngram occurrences="6" value="_fh" /> + <ngram occurrences="6" value="_ea" /> + <ngram occurrences="6" value="_du" /> + <ngram occurrences="6" value="_ce" /> + <ngram occurrences="6" value="_bhe" /> + <ngram occurrences="6" value="_am_" /> + <ngram occurrences="6" value="_am" /> + <ngram occurrences="6" value="_aig_" /> + <ngram occurrences="5" value="è" /> + <ngram occurrences="5" value="us_a" /> + <ngram occurrences="5" value="un_" /> + <ngram occurrences="5" value="thu" /> + <ngram occurrences="5" value="the" /> + <ngram occurrences="5" value="tai" /> + <ngram occurrences="5" value="si" /> + <ngram occurrences="5" value="s_c" /> + <ngram occurrences="5" value="s_a_" /> + <ngram occurrences="5" value="rt" /> + <ngram occurrences="5" value="ro" /> + <ngram occurrences="5" value="oine" /> + <ngram occurrences="5" value="ob" /> + <ngram occurrences="5" value="ni" /> + <ngram occurrences="5" value="neach" /> + <ngram occurrences="5" value="neac" /> + <ngram occurrences="5" value="nan_" /> + <ngram occurrences="5" value="nach" /> + <ngram occurrences="5" value="nac" /> + <ngram occurrences="5" value="n_d" /> + <ngram occurrences="5" value="n_b" /> + <ngram occurrences="5" value="ll" /> + <ngram occurrences="5" value="ithe" /> + <ngram occurrences="5" value="inn_" /> + <ngram occurrences="5" value="ine" /> + <ngram occurrences="5" value="im" /> + <ngram occurrences="5" value="ilea" /> + <ngram occurrences="5" value="idhea" /> + <ngram occurrences="5" value="id_" /> + <ngram occurrences="5" value="ich" /> + <ngram occurrences="5" value="iad_" /> + <ngram occurrences="5" value="iad" /> + <ngram occurrences="5" value="hean_" /> + <ngram occurrences="5" value="hean" /> + <ngram occurrences="5" value="han_" /> + <ngram occurrences="5" value="had" /> + <ngram occurrences="5" value="h_s" /> + <ngram occurrences="5" value="h_g" /> + <ngram occurrences="5" value="h_agu" /> + <ngram occurrences="5" value="h_ag" /> + <ngram occurrences="5" value="gus_a" /> + <ngram occurrences="5" value="eu" /> + <ngram occurrences="5" value="eo" /> + <ngram occurrences="5" value="eile" /> + <ngram occurrences="5" value="eann_" /> + <ngram occurrences="5" value="eann" /> + <ngram occurrences="5" value="eal" /> + <ngram occurrences="5" value="ead" /> + <ngram occurrences="5" value="eacha" /> + <ngram occurrences="5" value="e_a" /> + <ngram occurrences="5" value="dhea" /> + <ngram occurrences="5" value="chu" /> + <ngram occurrences="5" value="chi" /> + <ngram occurrences="5" value="bar" /> + <ngram occurrences="5" value="ath" /> + <ngram occurrences="5" value="as_" /> + <ngram occurrences="5" value="aoine" /> + <ngram occurrences="5" value="aoin" /> + <ngram occurrences="5" value="a_r" /> + <ngram occurrences="5" value="a_n" /> + <ngram occurrences="5" value="a_gài" /> + <ngram occurrences="5" value="a_gà" /> + <ngram occurrences="5" value="a_ch" /> + <ngram occurrences="5" value="a_bh" /> + <ngram occurrences="5" value="_thu" /> + <ngram occurrences="5" value="_ia" /> + <ngram occurrences="5" value="_eile" /> + <ngram occurrences="5" value="_eil" /> + <ngram occurrences="5" value="_chi" /> + <ngram occurrences="5" value="_bar" /> + <ngram occurrences="5" value="_ba" /> + <ngram occurrences="5" value="_a_t" /> + <ngram occurrences="5" value="_a_g" /> + <ngram occurrences="5" value="_a_d" /> + <ngram occurrences="5" value="_a_c" /> + <ngram occurrences="4" value="àrd" /> + <ngram occurrences="4" value="àna" /> + <ngram occurrences="4" value="àn" /> + <ngram occurrences="4" value="àidhe" /> + <ngram occurrences="4" value="uir" /> + <ngram occurrences="4" value="uid" /> + <ngram occurrences="4" value="thui" /> + <ngram occurrences="4" value="thea" /> + <ngram occurrences="4" value="st" /> + <ngram occurrences="4" value="sma" /> + <ngram occurrences="4" value="sm" /> + <ngram occurrences="4" value="sga" /> + <ngram occurrences="4" value="sea" /> +</ngrams> diff --git a/src/plugins/language/serbian.klp b/src/plugins/language/serbian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="819" value="_" /> + <ngram occurrences="420" value="a" /> + <ngram occurrences="416" value="o" /> + <ngram occurrences="378" value="i" /> + <ngram occurrences="335" value="e" /> + <ngram occurrences="262" value="n" /> + <ngram occurrences="225" value="s" /> + <ngram occurrences="197" value="t" /> + <ngram occurrences="195" value="j" /> + <ngram occurrences="178" value="a_" /> + <ngram occurrences="166" value="u" /> + <ngram occurrences="154" value="r" /> + <ngram occurrences="151" value="d" /> + <ngram occurrences="148" value="e_" /> + <ngram occurrences="147" value="l" /> + <ngram occurrences="134" value="v" /> + <ngram occurrences="125" value="y" /> + <ngram occurrences="124" value="m" /> + <ngram occurrences="123" value="o_" /> + <ngram occurrences="116" value="k" /> + <ngram occurrences="115" value="p" /> + <ngram occurrences="101" value="i_" /> + <ngram occurrences="96" value="je" /> + <ngram occurrences="94" value="z" /> + <ngram occurrences="93" value="c" /> + <ngram occurrences="90" value="_s" /> + <ngram occurrences="84" value="u_" /> + <ngram occurrences="81" value="_p" /> + <ngram occurrences="78" value="b" /> + <ngram occurrences="78" value="_n" /> + <ngram occurrences="71" value="je_" /> + <ngram occurrences="69" value="_i" /> + <ngram occurrences="66" value="g" /> + <ngram occurrences="61" value="_d" /> + <ngram occurrences="56" value="st" /> + <ngram occurrences="53" value="sy" /> + <ngram occurrences="51" value="na" /> + <ngram occurrences="51" value="cy" /> + <ngram occurrences="51" value="_j" /> + <ngram occurrences="49" value="ta" /> + <ngram occurrences="47" value="_u" /> + <ngram occurrences="46" value="po" /> + <ngram occurrences="46" value="_je" /> + <ngram occurrences="46" value="_b" /> + <ngram occurrences="44" value="os" /> + <ngram occurrences="44" value="da" /> + <ngram occurrences="43" value="ko" /> + <ngram occurrences="42" value="_o" /> + <ngram occurrences="41" value="ni" /> + <ngram occurrences="40" value="to" /> + <ngram occurrences="40" value="_po" /> + <ngram occurrences="39" value="no" /> + <ngram occurrences="39" value="m_" /> + <ngram occurrences="39" value="bi" /> + <ngram occurrences="38" value="ti" /> + <ngram occurrences="38" value="_je_" /> + <ngram occurrences="37" value="_m" /> + <ngram occurrences="36" value="ne" /> + <ngram occurrences="35" value="ra" /> + <ngram occurrences="35" value="is" /> + <ngram occurrences="35" value="an" /> + <ngram occurrences="35" value="_z" /> + <ngram occurrences="34" value="re" /> + <ngram occurrences="33" value="yi" /> + <ngram occurrences="33" value="n_" /> + <ngram occurrences="32" value="ov" /> + <ngram occurrences="32" value="na_" /> + <ngram occurrences="32" value="la" /> + <ngram occurrences="32" value="il" /> + <ngram occurrences="32" value="_t" /> + <ngram occurrences="31" value="li" /> + <ngram occurrences="31" value="en" /> + <ngram occurrences="31" value="_bi" /> + <ngram occurrences="30" value="vo" /> + <ngram occurrences="30" value="_k" /> + <ngram occurrences="29" value="og" /> + <ngram occurrences="29" value="lo" /> + <ngram occurrences="28" value="pr" /> + <ngram occurrences="28" value="ja" /> + <ngram occurrences="28" value="iz" /> + <ngram occurrences="28" value="da_" /> + <ngram occurrences="27" value="za" /> + <ngram occurrences="27" value="ro" /> + <ngram occurrences="27" value="on" /> + <ngram occurrences="27" value="in" /> + <ngram occurrences="27" value="ij" /> + <ngram occurrences="27" value="cj" /> + <ngram occurrences="27" value="_i_" /> + <ngram occurrences="26" value="om" /> + <ngram occurrences="26" value="oj" /> + <ngram occurrences="26" value="le" /> + <ngram occurrences="26" value="_pr" /> + <ngram occurrences="25" value="vi" /> + <ngram occurrences="25" value="nj" /> + <ngram occurrences="25" value="im" /> + <ngram occurrences="25" value="_v" /> + <ngram occurrences="25" value="_u_" /> + <ngram occurrences="25" value="_da" /> + <ngram occurrences="24" value="ve" /> + <ngram occurrences="24" value="a_i" /> + <ngram occurrences="24" value="_ne" /> + <ngram occurrences="23" value="va" /> + <ngram occurrences="23" value="od" /> + <ngram occurrences="23" value="cyi" /> + <ngram occurrences="23" value="av" /> + <ngram occurrences="23" value="ar" /> + <ngram occurrences="23" value="_za" /> + <ngram occurrences="23" value="_na" /> + <ngram occurrences="23" value="_iz" /> + <ngram occurrences="22" value="sa" /> + <ngram occurrences="22" value="ma" /> + <ngram occurrences="22" value="ka" /> + <ngram occurrences="22" value="ju" /> + <ngram occurrences="22" value="es" /> + <ngram occurrences="21" value="zy" /> + <ngram occurrences="21" value="to_" /> + <ngram occurrences="21" value="no_" /> + <ngram occurrences="21" value="mo" /> + <ngram occurrences="21" value="ed" /> + <ngram occurrences="21" value="ad" /> + <ngram occurrences="21" value="_da_" /> + <ngram occurrences="20" value="ti_" /> + <ngram occurrences="20" value="se" /> + <ngram occurrences="20" value="it" /> + <ngram occurrences="19" value="tr" /> + <ngram occurrences="19" value="do" /> + <ngram occurrences="19" value="de" /> + <ngram occurrences="19" value="al" /> + <ngram occurrences="19" value="ak" /> + <ngram occurrences="19" value="_na_" /> + <ngram occurrences="19" value="_c" /> + <ngram occurrences="18" value="yt" /> + <ngram occurrences="18" value="ta_" /> + <ngram occurrences="18" value="syt" /> + <ngram occurrences="18" value="om_" /> + <ngram occurrences="18" value="nu" /> + <ngram occurrences="18" value="lj" /> + <ngram occurrences="18" value="h" /> + <ngram occurrences="18" value="d_" /> + <ngram occurrences="18" value="a_p" /> + <ngram occurrences="18" value="a_n" /> + <ngram occurrences="18" value="_r" /> + <ngram occurrences="18" value="_ko" /> + <ngram occurrences="17" value="ri" /> + <ngram occurrences="17" value="ju_" /> + <ngram occurrences="17" value="go" /> + <ngram occurrences="17" value="et" /> + <ngram occurrences="17" value="ek" /> + <ngram occurrences="17" value="e_s" /> + <ngram occurrences="17" value="bil" /> + <ngram occurrences="17" value="ao_" /> + <ngram occurrences="17" value="ao" /> + <ngram occurrences="17" value="ac" /> + <ngram occurrences="17" value="a_s" /> + <ngram occurrences="17" value="_g" /> + <ngram occurrences="16" value="ye" /> + <ngram occurrences="16" value="sta" /> + <ngram occurrences="16" value="or" /> + <ngram occurrences="16" value="ob" /> + <ngram occurrences="16" value="ji" /> + <ngram occurrences="16" value="ik" /> + <ngram occurrences="16" value="ec" /> + <ngram occurrences="16" value="_bil" /> + <ngram occurrences="15" value="sto" /> + <ngram occurrences="15" value="ot" /> + <ngram occurrences="15" value="osy" /> + <ngram occurrences="15" value="o_d" /> + <ngram occurrences="15" value="lo_" /> + <ngram occurrences="15" value="la_" /> + <ngram occurrences="15" value="ije" /> + <ngram occurrences="15" value="i_s" /> + <ngram occurrences="15" value="e_n" /> + <ngram occurrences="15" value="_se" /> + <ngram occurrences="15" value="_sa" /> + <ngram occurrences="15" value="_do" /> + <ngram occurrences="15" value="_cy" /> + <ngram occurrences="14" value="te" /> + <ngram occurrences="14" value="pa" /> + <ngram occurrences="14" value="ost" /> + <ngram occurrences="14" value="o_s" /> + <ngram occurrences="14" value="koj" /> + <ngram occurrences="14" value="im_" /> + <ngram occurrences="14" value="ih" /> + <ngram occurrences="14" value="ic" /> + <ngram occurrences="14" value="e_b" /> + <ngram occurrences="14" value="at" /> + <ngram occurrences="14" value="a_j" /> + <ngram occurrences="14" value="_l" /> + <ngram occurrences="14" value="_a" /> + <ngram occurrences="13" value="su" /> + <ngram occurrences="13" value="sl" /> + <ngram occurrences="13" value="pos" /> + <ngram occurrences="13" value="ovo" /> + <ngram occurrences="13" value="on_" /> + <ngram occurrences="13" value="o_je" /> + <ngram occurrences="13" value="o_j" /> + <ngram occurrences="13" value="mi" /> + <ngram occurrences="13" value="ma_" /> + <ngram occurrences="13" value="li_" /> + <ngram occurrences="13" value="jo" /> + <ngram occurrences="13" value="iv" /> + <ngram occurrences="13" value="ih_" /> + <ngram occurrences="13" value="h_" /> + <ngram occurrences="13" value="ga" /> + <ngram occurrences="13" value="em" /> + <ngram occurrences="13" value="e_p" /> + <ngram occurrences="13" value="dn" /> + <ngram occurrences="13" value="a_je" /> + <ngram occurrences="13" value="_on" /> + <ngram occurrences="13" value="_ni" /> + <ngram occurrences="13" value="_mo" /> + <ngram occurrences="13" value="_koj" /> + <ngram occurrences="12" value="ut" /> + <ngram occurrences="12" value="u_n" /> + <ngram occurrences="12" value="se_" /> + <ngram occurrences="12" value="ol" /> + <ngram occurrences="12" value="me" /> + <ngram occurrences="12" value="ki" /> + <ngram occurrences="12" value="j_" /> + <ngram occurrences="12" value="i_p" /> + <ngram occurrences="12" value="e_u" /> + <ngram occurrences="12" value="e_bi" /> + <ngram occurrences="12" value="am" /> + <ngram occurrences="12" value="a_u" /> + <ngram occurrences="12" value="a_je_" /> + <ngram occurrences="12" value="a_i_" /> + <ngram occurrences="12" value="a_d" /> + <ngram occurrences="12" value="_to" /> + <ngram occurrences="12" value="_se_" /> + <ngram occurrences="12" value="_pos" /> + <ngram occurrences="12" value="_is" /> + <ngram occurrences="11" value="yn" /> + <ngram occurrences="11" value="uc" /> + <ngram occurrences="11" value="t_" /> + <ngram occurrences="11" value="o_p" /> + <ngram occurrences="11" value="o_je_" /> + <ngram occurrences="11" value="nje" /> + <ngram occurrences="11" value="je_bi" /> + <ngram occurrences="11" value="je_b" /> + <ngram occurrences="11" value="ja_" /> + <ngram occurrences="11" value="ist" /> + <ngram occurrences="11" value="io" /> + <ngram occurrences="11" value="ima" /> + <ngram occurrences="11" value="ije_" /> + <ngram occurrences="11" value="i_d" /> + <ngram occurrences="11" value="gl" /> + <ngram occurrences="11" value="ga_" /> + <ngram occurrences="11" value="az" /> + <ngram occurrences="11" value="_sy" /> + <ngram occurrences="10" value="za_" /> + <ngram occurrences="10" value="y_" /> + <ngram occurrences="10" value="u_s" /> + <ngram occurrences="10" value="sv" /> + <ngram occurrences="10" value="sti" /> + <ngram occurrences="10" value="pi" /> + <ngram occurrences="10" value="o_n" /> + <ngram occurrences="10" value="nos" /> + <ngram occurrences="10" value="ne_" /> + <ngram occurrences="10" value="ko_" /> + <ngram occurrences="10" value="k_" /> + <ngram occurrences="10" value="iti_" /> + <ngram occurrences="10" value="iti" /> + <ngram occurrences="10" value="io_" /> + <ngram occurrences="10" value="ima_" /> + <ngram occurrences="10" value="i_po" /> + <ngram occurrences="10" value="i_n" /> + <ngram occurrences="10" value="gu" /> + <ngram occurrences="10" value="br" /> + <ngram occurrences="10" value="ba" /> + <ngram occurrences="10" value="as" /> + <ngram occurrences="10" value="aj" /> + <ngram occurrences="10" value="acy" /> + <ngram occurrences="10" value="a_k" /> + <ngram occurrences="10" value="_za_" /> + <ngram occurrences="10" value="_ve" /> + <ngram occurrences="10" value="_sv" /> + <ngram occurrences="10" value="_no" /> + <ngram occurrences="10" value="_je_b" /> + <ngram occurrences="9" value="zn" /> + <ngram occurrences="9" value="z_" /> + <ngram occurrences="9" value="yl" /> + <ngram occurrences="9" value="yi_" /> + <ngram occurrences="9" value="up" /> + <ngram occurrences="9" value="su_" /> + <ngram occurrences="9" value="sk" /> + <ngram occurrences="9" value="s_" /> + <ngram occurrences="9" value="nij" /> + <ngram occurrences="9" value="ni_" /> + <ngram occurrences="9" value="le_" /> + <ngram occurrences="9" value="ke" /> + <ngram occurrences="9" value="je_s" /> + <ngram occurrences="9" value="iz_" /> + <ngram occurrences="9" value="ili" /> + <ngram occurrences="9" value="est" /> + <ngram occurrences="9" value="er" /> + <ngram occurrences="9" value="e_o" /> + <ngram occurrences="9" value="e_m" /> + <ngram occurrences="9" value="di" /> + <ngram occurrences="9" value="an_" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="_vi" /> + <ngram occurrences="9" value="_st" /> + <ngram occurrences="9" value="_re" /> + <ngram occurrences="8" value="yin" /> + <ngram occurrences="8" value="vr" /> + <ngram occurrences="8" value="va_" /> + <ngram occurrences="8" value="ucj" /> + <ngram occurrences="8" value="tu" /> + <ngram occurrences="8" value="te_" /> + <ngram occurrences="8" value="sy_" /> + <ngram occurrences="8" value="sp" /> + <ngram occurrences="8" value="pro" /> + <ngram occurrences="8" value="pre" /> + <ngram occurrences="8" value="ok" /> + <ngram occurrences="8" value="oc" /> + <ngram occurrences="8" value="o_b" /> + <ngram occurrences="8" value="nu_" /> + <ngram occurrences="8" value="nje_" /> + <ngram occurrences="8" value="lik" /> + <ngram occurrences="8" value="ka_" /> + <ngram occurrences="8" value="jen" /> + <ngram occurrences="8" value="je_n" /> + <ngram occurrences="8" value="jao_" /> + <ngram occurrences="8" value="jao" /> + <ngram occurrences="8" value="isy" /> + <ngram occurrences="8" value="ilo_" /> + <ngram occurrences="8" value="ilo" /> + <ngram occurrences="8" value="ila_" /> + <ngram occurrences="8" value="ila" /> + <ngram occurrences="8" value="esy" /> + <ngram occurrences="8" value="el" /> + <ngram occurrences="8" value="ecy" /> + <ngram occurrences="8" value="e_z" /> + <ngram occurrences="8" value="e_i" /> + <ngram occurrences="8" value="e_bil" /> + <ngram occurrences="8" value="de_" /> + <ngram occurrences="8" value="cje" /> + <ngram occurrences="8" value="anj" /> + <ngram occurrences="8" value="ad_" /> + <ngram occurrences="8" value="a_u_" /> + <ngram occurrences="8" value="a_pr" /> + <ngram occurrences="8" value="a_ko" /> + <ngram occurrences="8" value="a_iz" /> + <ngram occurrences="8" value="_zy" /> + <ngram occurrences="8" value="_tr" /> + <ngram occurrences="8" value="_su" /> + <ngram occurrences="8" value="_pro" /> + <ngram occurrences="8" value="_pre" /> + <ngram occurrences="8" value="_od" /> + <ngram occurrences="8" value="_ka" /> + <ngram occurrences="8" value="_iz_" /> + <ngram occurrences="8" value="_go" /> + <ngram occurrences="7" value="zyi" /> + <ngram occurrences="7" value="zna" /> + <ngram occurrences="7" value="yu" /> + <ngram occurrences="7" value="yto_" /> + <ngram occurrences="7" value="yto" /> + <ngram occurrences="7" value="ye_" /> + <ngram occurrences="7" value="vo_" /> + <ngram occurrences="7" value="u_p" /> + <ngram occurrences="7" value="u_i" /> + <ngram occurrences="7" value="tu_" /> + <ngram occurrences="7" value="syto_" /> + <ngram occurrences="7" value="syto" /> + <ngram occurrences="7" value="sam" /> + <ngram occurrences="7" value="ru" /> + <ngram occurrences="7" value="ren" /> + <ngram occurrences="7" value="recy" /> + <ngram occurrences="7" value="rec" /> + <ngram occurrences="7" value="pot" /> + <ngram occurrences="7" value="ovi" /> + <ngram occurrences="7" value="ora" /> + <ngram occurrences="7" value="odi" /> + <ngram occurrences="7" value="o_v" /> + <ngram occurrences="7" value="o_t" /> + <ngram occurrences="7" value="o_da" /> + <ngram occurrences="7" value="o_bi" /> + <ngram occurrences="7" value="nut" /> + <ngram occurrences="7" value="nji" /> + <ngram occurrences="7" value="nije" /> + <ngram occurrences="7" value="nek" /> + <ngram occurrences="7" value="mog" /> + <ngram occurrences="7" value="m_i" /> + <ngram occurrences="7" value="kom" /> + <ngram occurrences="7" value="jim" /> + <ngram occurrences="7" value="jed" /> + <ngram occurrences="7" value="je_u" /> + <ngram occurrences="7" value="icy" /> + <ngram occurrences="7" value="gov" /> + <ngram occurrences="7" value="ev" /> + <ngram occurrences="7" value="enu" /> + <ngram occurrences="7" value="eg" /> + <ngram occurrences="7" value="edn" /> + <ngram occurrences="7" value="ecj" /> + <ngram occurrences="7" value="e_po" /> + <ngram occurrences="7" value="e_j" /> + <ngram occurrences="7" value="du" /> + <ngram occurrences="7" value="dan" /> + <ngram occurrences="7" value="cyin" /> + <ngram occurrences="7" value="ci" /> +</ngrams> diff --git a/src/plugins/language/slovak.klp b/src/plugins/language/slovak.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="662" value="_" /> + <ngram occurrences="375" value="a" /> + <ngram occurrences="335" value="o" /> + <ngram occurrences="311" value="e" /> + <ngram occurrences="269" value="n" /> + <ngram occurrences="248" value="i" /> + <ngram occurrences="201" value="r" /> + <ngram occurrences="190" value="v" /> + <ngram occurrences="179" value="s" /> + <ngram occurrences="169" value="t" /> + <ngram occurrences="152" value="k" /> + <ngram occurrences="151" value="l" /> + <ngram occurrences="148" value="c" /> + <ngram occurrences="143" value="p" /> + <ngram occurrences="138" value="u" /> + <ngram occurrences="137" value="d" /> + <ngram occurrences="112" value="a_" /> + <ngram occurrences="108" value="y" /> + <ngram occurrences="96" value="m" /> + <ngram occurrences="92" value="h" /> + <ngram occurrences="83" value="e_" /> + <ngram occurrences="81" value="z" /> + <ngram occurrences="80" value="_p" /> + <ngram occurrences="79" value="na" /> + <ngram occurrences="69" value="_v" /> + <ngram occurrences="65" value="j" /> + <ngram occurrences="65" value="_s" /> + <ngram occurrences="61" value="ov" /> + <ngram occurrences="60" value="po" /> + <ngram occurrences="58" value="_n" /> + <ngram occurrences="57" value="i_" /> + <ngram occurrences="55" value="v_" /> + <ngram occurrences="53" value="u_" /> + <ngram occurrences="53" value="ro" /> + <ngram occurrences="53" value="b" /> + <ngram occurrences="51" value="o_" /> + <ngram occurrences="47" value="_na" /> + <ngram occurrences="46" value="ch" /> + <ngram occurrences="45" value="y_" /> + <ngram occurrences="43" value="ne" /> + <ngram occurrences="43" value="_a" /> + <ngram occurrences="41" value="en" /> + <ngram occurrences="41" value="_z" /> + <ngram occurrences="40" value="re" /> + <ngram occurrences="39" value="st" /> + <ngram occurrences="39" value="h_" /> + <ngram occurrences="38" value="la" /> + <ngram occurrences="38" value="an" /> + <ngram occurrences="37" value="_po" /> + <ngram occurrences="35" value="pr" /> + <ngram occurrences="34" value="ch_" /> + <ngram occurrences="34" value="_t" /> + <ngram occurrences="33" value="vy" /> + <ngram occurrences="32" value="ci" /> + <ngram occurrences="32" value="_v_" /> + <ngram occurrences="32" value="_o" /> + <ngram occurrences="31" value="od" /> + <ngram occurrences="31" value="na_" /> + <ngram occurrences="31" value="ie" /> + <ngram occurrences="31" value="_pr" /> + <ngram occurrences="30" value="ko" /> + <ngram occurrences="30" value="_m" /> + <ngram occurrences="29" value="sk" /> + <ngram occurrences="29" value="_k" /> + <ngram occurrences="28" value="ti" /> + <ngram occurrences="28" value="er" /> + <ngram occurrences="27" value="ve" /> + <ngram occurrences="27" value="al" /> + <ngram occurrences="27" value="_r" /> + <ngram occurrences="26" value="ra" /> + <ngram occurrences="26" value="or" /> + <ngram occurrences="26" value="ni" /> + <ngram occurrences="26" value="in" /> + <ngram occurrences="26" value="ed" /> + <ngram occurrences="25" value="yc" /> + <ngram occurrences="25" value="va" /> + <ngram occurrences="25" value="ny" /> + <ngram occurrences="25" value="mi" /> + <ngram occurrences="25" value="ak" /> + <ngram occurrences="24" value="ych" /> + <ngram occurrences="24" value="to" /> + <ngram occurrences="24" value="le" /> + <ngram occurrences="24" value="ho" /> + <ngram occurrences="24" value="ce" /> + <ngram occurrences="24" value="ad" /> + <ngram occurrences="24" value="ac" /> + <ngram occurrences="24" value="_na_" /> + <ngram occurrences="24" value="_d" /> + <ngram occurrences="23" value="tr" /> + <ngram occurrences="23" value="t_" /> + <ngram occurrences="23" value="si" /> + <ngram occurrences="23" value="ov_" /> + <ngram occurrences="23" value="ka" /> + <ngram occurrences="23" value="_c" /> + <ngram occurrences="22" value="ych_" /> + <ngram occurrences="22" value="no" /> + <ngram occurrences="22" value="li" /> + <ngram occurrences="22" value="il" /> + <ngram occurrences="22" value="_u" /> + <ngram occurrences="21" value="te" /> + <ngram occurrences="21" value="sa" /> + <ngram occurrences="21" value="ok" /> + <ngram occurrences="20" value="os" /> + <ngram occurrences="20" value="om" /> + <ngram occurrences="20" value="it" /> + <ngram occurrences="20" value="do" /> + <ngram occurrences="19" value="za" /> + <ngram occurrences="19" value="ta" /> + <ngram occurrences="19" value="me" /> + <ngram occurrences="19" value="l_" /> + <ngram occurrences="19" value="ku" /> + <ngram occurrences="19" value="ia" /> + <ngram occurrences="19" value="da" /> + <ngram occurrences="19" value="_b" /> + <ngram occurrences="18" value="pre" /> + <ngram occurrences="18" value="m_" /> + <ngram occurrences="18" value="es" /> + <ngram occurrences="18" value="a_p" /> + <ngram occurrences="18" value="_a_" /> + <ngram occurrences="17" value="oc" /> + <ngram occurrences="17" value="ej" /> + <ngram occurrences="17" value="aj" /> + <ngram occurrences="17" value="_sa" /> + <ngram occurrences="17" value="_pre" /> + <ngram occurrences="16" value="ur" /> + <ngram occurrences="16" value="r_" /> + <ngram occurrences="16" value="on" /> + <ngram occurrences="16" value="ol" /> + <ngram occurrences="16" value="lo" /> + <ngram occurrences="16" value="ky" /> + <ngram occurrences="16" value="j_" /> + <ngram occurrences="16" value="el" /> + <ngram occurrences="16" value="at" /> + <ngram occurrences="16" value="ap" /> + <ngram occurrences="16" value="_za" /> + <ngram occurrences="16" value="_vy" /> + <ngram occurrences="15" value="vo" /> + <ngram occurrences="15" value="sa_" /> + <ngram occurrences="15" value="rok" /> + <ngram occurrences="15" value="ri" /> + <ngram occurrences="15" value="ne_" /> + <ngram occurrences="15" value="ic" /> + <ngram occurrences="15" value="f" /> + <ngram occurrences="15" value="av" /> + <ngram occurrences="15" value="as" /> + <ngram occurrences="15" value="_ro" /> + <ngram occurrences="15" value="_j" /> + <ngram occurrences="14" value="zi" /> + <ngram occurrences="14" value="ob" /> + <ngram occurrences="14" value="nych_" /> + <ngram occurrences="14" value="nych" /> + <ngram occurrences="14" value="nyc" /> + <ngram occurrences="14" value="ke" /> + <ngram occurrences="14" value="k_" /> + <ngram occurrences="14" value="eh" /> + <ngram occurrences="14" value="d_" /> + <ngram occurrences="14" value="_sa_" /> + <ngram occurrences="13" value="v_p" /> + <ngram occurrences="13" value="us" /> + <ngram occurrences="13" value="pod" /> + <ngram occurrences="13" value="ot" /> + <ngram occurrences="13" value="nu" /> + <ngram occurrences="13" value="ln" /> + <ngram occurrences="13" value="ie_" /> + <ngram occurrences="13" value="ho_" /> + <ngram occurrences="13" value="eho_" /> + <ngram occurrences="13" value="eho" /> + <ngram occurrences="13" value="e_v" /> + <ngram occurrences="13" value="dn" /> + <ngram occurrences="13" value="di" /> + <ngram occurrences="13" value="de" /> + <ngram occurrences="13" value="co" /> + <ngram occurrences="13" value="am" /> + <ngram occurrences="13" value="a_v" /> + <ngram occurrences="13" value="_do" /> + <ngram occurrences="12" value="sp" /> + <ngram occurrences="12" value="rov" /> + <ngram occurrences="12" value="pa" /> + <ngram occurrences="12" value="nt" /> + <ngram occurrences="12" value="n_" /> + <ngram occurrences="12" value="li_" /> + <ngram occurrences="12" value="g" /> + <ngram occurrences="12" value="ar" /> + <ngram occurrences="12" value="a_n" /> + <ngram occurrences="12" value="_ak" /> + <ngram occurrences="11" value="zn" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="om_" /> + <ngram occurrences="11" value="ny_" /> + <ngram occurrences="11" value="la_" /> + <ngram occurrences="11" value="ky_" /> + <ngram occurrences="11" value="kt" /> + <ngram occurrences="11" value="em" /> + <ngram occurrences="11" value="ej_" /> + <ngram occurrences="11" value="e_p" /> + <ngram occurrences="11" value="e_n" /> + <ngram occurrences="11" value="az" /> + <ngram occurrences="11" value="a_s" /> + <ngram occurrences="11" value="_tr" /> + <ngram occurrences="11" value="_pod" /> + <ngram occurrences="11" value="_h" /> + <ngram occurrences="11" value="_ce" /> + <ngram occurrences="10" value="zv" /> + <ngram occurrences="10" value="z_" /> + <ngram occurrences="10" value="pe" /> + <ngram occurrences="10" value="oz" /> + <ngram occurrences="10" value="ovy" /> + <ngram occurrences="10" value="ove" /> + <ngram occurrences="10" value="ova" /> + <ngram occurrences="10" value="nc" /> + <ngram occurrences="10" value="nan" /> + <ngram occurrences="10" value="ka_" /> + <ngram occurrences="10" value="ju" /> + <ngram occurrences="10" value="ik" /> + <ngram occurrences="10" value="ek" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="cen" /> + <ngram occurrences="10" value="ast" /> + <ngram occurrences="10" value="a_po" /> + <ngram occurrences="10" value="a_na" /> + <ngram occurrences="10" value="_ob" /> + <ngram occurrences="10" value="_l" /> + <ngram occurrences="10" value="_i" /> + <ngram occurrences="10" value="_e" /> + <ngram occurrences="9" value="uro" /> + <ngram occurrences="9" value="tor" /> + <ngram occurrences="9" value="ti_" /> + <ngram occurrences="9" value="ska" /> + <ngram occurrences="9" value="ru" /> + <ngram occurrences="9" value="pri" /> + <ngram occurrences="9" value="pl" /> + <ngram occurrences="9" value="nu_" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="lad" /> + <ngram occurrences="9" value="ku_" /> + <ngram occurrences="9" value="kov" /> + <ngram occurrences="9" value="kl" /> + <ngram occurrences="9" value="je" /> + <ngram occurrences="9" value="ja" /> + <ngram occurrences="9" value="iv" /> + <ngram occurrences="9" value="i_s" /> + <ngram occurrences="9" value="cov" /> + <ngram occurrences="9" value="_v_p" /> + <ngram occurrences="9" value="_ne" /> + <ngram occurrences="9" value="_mi" /> + <ngram occurrences="8" value="ze" /> + <ngram occurrences="8" value="ys" /> + <ngram occurrences="8" value="vys" /> + <ngram occurrences="8" value="vn" /> + <ngram occurrences="8" value="uc" /> + <ngram occurrences="8" value="tu" /> + <ngram occurrences="8" value="trh" /> + <ngram occurrences="8" value="su" /> + <ngram occurrences="8" value="st_" /> + <ngram occurrences="8" value="sl" /> + <ngram occurrences="8" value="ske" /> + <ngram occurrences="8" value="rh" /> + <ngram occurrences="8" value="red" /> + <ngram occurrences="8" value="pred" /> + <ngram occurrences="8" value="nej" /> + <ngram occurrences="8" value="mi_" /> + <ngram occurrences="8" value="ina" /> + <ngram occurrences="8" value="il_" /> + <ngram occurrences="8" value="ia_" /> + <ngram occurrences="8" value="et" /> + <ngram occurrences="8" value="est" /> + <ngram occurrences="8" value="er_" /> + <ngram occurrences="8" value="ent" /> + <ngram occurrences="8" value="en_" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="ca" /> + <ngram occurrences="8" value="ani" /> + <ngram occurrences="8" value="a_t" /> + <ngram occurrences="8" value="_zv" /> + <ngram occurrences="8" value="_ur" /> + <ngram occurrences="8" value="_trh" /> + <ngram occurrences="8" value="_st" /> + <ngram occurrences="8" value="_sp" /> + <ngram occurrences="8" value="_rok" /> + <ngram occurrences="8" value="_pri" /> + <ngram occurrences="8" value="_pred" /> + <ngram occurrences="8" value="_me" /> + <ngram occurrences="7" value="van" /> + <ngram occurrences="7" value="v_o" /> + <ngram occurrences="7" value="usd_" /> + <ngram occurrences="7" value="usd" /> + <ngram occurrences="7" value="up" /> + <ngram occurrences="7" value="uj" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="u_a" /> + <ngram occurrences="7" value="to_" /> + <ngram occurrences="7" value="te_" /> + <ngram occurrences="7" value="sti" /> + <ngram occurrences="7" value="sta" /> + <ngram occurrences="7" value="spo" /> + <ngram occurrences="7" value="sil" /> + <ngram occurrences="7" value="sd_" /> + <ngram occurrences="7" value="sd" /> + <ngram occurrences="7" value="ost" /> + <ngram occurrences="7" value="oro" /> + <ngram occurrences="7" value="o_v" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="nej_" /> + <ngram occurrences="7" value="neho_" /> + <ngram occurrences="7" value="neho" /> + <ngram occurrences="7" value="neh" /> + <ngram occurrences="7" value="naj" /> + <ngram occurrences="7" value="na_t" /> + <ngram occurrences="7" value="kci" /> + <ngram occurrences="7" value="kc" /> + <ngram occurrences="7" value="je_" /> + <ngram occurrences="7" value="is" /> + <ngram occurrences="7" value="hod" /> + <ngram occurrences="7" value="ep" /> + <ngram occurrences="7" value="eni" /> + <ngram occurrences="7" value="ec" /> + <ngram occurrences="7" value="du_" /> + <ngram occurrences="7" value="br" /> + <ngram occurrences="7" value="ati" /> + <ngram occurrences="7" value="ali" /> + <ngram occurrences="7" value="akci" /> + <ngram occurrences="7" value="akc" /> + <ngram occurrences="7" value="a_u" /> + <ngram occurrences="7" value="_usd_" /> + <ngram occurrences="7" value="_usd" /> + <ngram occurrences="7" value="_us" /> + <ngram occurrences="7" value="_uro" /> + <ngram occurrences="7" value="_su" /> + <ngram occurrences="7" value="_sk" /> + <ngram occurrences="7" value="_naj" /> + <ngram occurrences="7" value="_na_t" /> + <ngram occurrences="7" value="_in" /> + <ngram occurrences="7" value="_f" /> + <ngram occurrences="7" value="_cen" /> + <ngram occurrences="7" value="_akci" /> + <ngram occurrences="7" value="_akc" /> + <ngram occurrences="6" value="zac" /> + <ngram occurrences="6" value="y_p" /> + <ngram occurrences="6" value="y_a" /> + <ngram occurrences="6" value="vl" /> + <ngram occurrences="6" value="v_po" /> + <ngram occurrences="6" value="uk" /> + <ngram occurrences="6" value="u_p" /> + <ngram occurrences="6" value="u_n" /> + <ngram occurrences="6" value="u_a_" /> + <ngram occurrences="6" value="ty" /> + <ngram occurrences="6" value="tre" /> + <ngram occurrences="6" value="tn" /> + <ngram occurrences="6" value="tiv" /> + <ngram occurrences="6" value="sti_" /> + <ngram occurrences="6" value="ska_" /> + <ngram occurrences="6" value="sia" /> + <ngram occurrences="6" value="se" /> + <ngram occurrences="6" value="s_" /> + <ngram occurrences="6" value="roku_" /> + <ngram occurrences="6" value="roku" /> + <ngram occurrences="6" value="rod" /> + <ngram occurrences="6" value="ri_" /> + <ngram occurrences="6" value="re_" /> + <ngram occurrences="6" value="pos" /> + <ngram occurrences="6" value="por" /> + <ngram occurrences="6" value="otr" /> + <ngram occurrences="6" value="osl" /> + <ngram occurrences="6" value="ore" /> + <ngram occurrences="6" value="oku_" /> + <ngram occurrences="6" value="oku" /> + <ngram occurrences="6" value="odn" /> + <ngram occurrences="6" value="o_z" /> + <ngram occurrences="6" value="o_s" /> + <ngram occurrences="6" value="nsk" /> + <ngram occurrences="6" value="nov" /> + <ngram occurrences="6" value="ni_" /> + <ngram occurrences="6" value="mu" /> + <ngram occurrences="6" value="mie" /> + <ngram occurrences="6" value="ly" /> + <ngram occurrences="6" value="kon" /> + <ngram occurrences="6" value="ke_" /> + <ngram occurrences="6" value="iny_" /> + <ngram occurrences="6" value="iny" /> + <ngram occurrences="6" value="ii_" /> + <ngram occurrences="6" value="ii" /> + <ngram occurrences="6" value="id" /> + <ngram occurrences="6" value="i_v" /> + <ngram occurrences="6" value="i_n" /> + <ngram occurrences="6" value="hr" /> + <ngram occurrences="6" value="he" /> + <ngram occurrences="6" value="ele" /> + <ngram occurrences="6" value="eb" /> + <ngram occurrences="6" value="e_v_" /> + <ngram occurrences="6" value="e_po" /> + <ngram occurrences="6" value="e_na" /> + <ngram occurrences="6" value="e_m" /> + <ngram occurrences="6" value="cov_" /> + <ngram occurrences="6" value="cii_" /> + <ngram occurrences="6" value="cii" /> + <ngram occurrences="6" value="cie" /> + <ngram occurrences="6" value="cho" /> + <ngram occurrences="6" value="by" /> + <ngram occurrences="6" value="ast_" /> + <ngram occurrences="6" value="alo" /> +</ngrams> diff --git a/src/plugins/language/slovak2.klp b/src/plugins/language/slovak2.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="701" value="_" /> + <ngram occurrences="379" value="o" /> + <ngram occurrences="334" value="a" /> + <ngram occurrences="287" value="e" /> + <ngram occurrences="240" value="i" /> + <ngram occurrences="237" value="n" /> + <ngram occurrences="217" value="v" /> + <ngram occurrences="198" value="r" /> + <ngram occurrences="194" value="t" /> + <ngram occurrences="177" value="s" /> + <ngram occurrences="139" value="d" /> + <ngram occurrences="137" value="p" /> + <ngram occurrences="132" value="m" /> + <ngram occurrences="130" value="k" /> + <ngram occurrences="125" value="a_" /> + <ngram occurrences="122" value="l" /> + <ngram occurrences="95" value="u" /> + <ngram occurrences="93" value="c" /> + <ngram occurrences="90" value="_p" /> + <ngram occurrences="88" value="h" /> + <ngram occurrences="87" value="_v" /> + <ngram occurrences="79" value="z" /> + <ngram occurrences="77" value="j" /> + <ngram occurrences="76" value="e_" /> + <ngram occurrences="74" value="á" /> + <ngram occurrences="67" value="b" /> + <ngram occurrences="63" value="st" /> + <ngram occurrences="63" value="pr" /> + <ngram occurrences="61" value="_s" /> + <ngram occurrences="58" value="y" /> + <ngram occurrences="55" value="o_" /> + <ngram occurrences="55" value="_pr" /> + <ngram occurrences="54" value="ov" /> + <ngram occurrences="54" value="i_" /> + <ngram occurrences="54" value="_a" /> + <ngram occurrences="52" value="v_" /> + <ngram occurrences="49" value="_n" /> + <ngram occurrences="46" value="è" /> + <ngram occurrences="43" value="ý" /> + <ngram occurrences="43" value="an" /> + <ngram occurrences="42" value="í" /> + <ngram occurrences="42" value="re" /> + <ngram occurrences="42" value="po" /> + <ngram occurrences="41" value="u_" /> + <ngram occurrences="41" value="ch" /> + <ngram occurrences="41" value="_o" /> + <ngram occurrences="40" value="to" /> + <ngram occurrences="40" value="m_" /> + <ngram occurrences="39" value="ne" /> + <ngram occurrences="38" value="ni" /> + <ngram occurrences="37" value="os" /> + <ngram occurrences="37" value="ed" /> + <ngram occurrences="37" value="_z" /> + <ngram occurrences="35" value="or" /> + <ngram occurrences="34" value="va" /> + <ngram occurrences="34" value="na" /> + <ngram occurrences="34" value="h_" /> + <ngram occurrences="34" value="ch_" /> + <ngram occurrences="33" value="ro" /> + <ngram occurrences="33" value="om" /> + <ngram occurrences="33" value="ko" /> + <ngram occurrences="33" value="ie" /> + <ngram occurrences="33" value="_m" /> + <ngram occurrences="32" value="ú" /> + <ngram occurrences="32" value="do" /> + <ngram occurrences="32" value="_v_" /> + <ngram occurrences="31" value="_t" /> + <ngram occurrences="31" value="_k" /> + <ngram occurrences="30" value="no" /> + <ngram occurrences="29" value="é" /> + <ngram occurrences="28" value="li" /> + <ngram occurrences="28" value="_po" /> + <ngram occurrences="28" value="_a_" /> + <ngram occurrences="27" value="y_" /> + <ngram occurrences="27" value="pre" /> + <ngram occurrences="27" value="j_" /> + <ngram occurrences="27" value="ia" /> + <ngram occurrences="27" value="ho" /> + <ngram occurrences="27" value="en" /> + <ngram occurrences="27" value="_pre" /> + <ngram occurrences="25" value="ti" /> + <ngram occurrences="25" value="od" /> + <ngram occurrences="25" value="la" /> + <ngram occurrences="24" value="ra" /> + <ngram occurrences="24" value="ci" /> + <ngram occurrences="24" value="_d" /> + <ngram occurrences="23" value="ob" /> + <ngram occurrences="23" value="aj" /> + <ngram occurrences="23" value="_i" /> + <ngram occurrences="22" value="va_" /> + <ngram occurrences="22" value="te" /> + <ngram occurrences="21" value="vo" /> + <ngram occurrences="21" value="vi" /> + <ngram occurrences="21" value="ve" /> + <ngram occurrences="21" value="s_" /> + <ngram occurrences="21" value="ova" /> + <ngram occurrences="21" value="ej" /> + <ngram occurrences="21" value="de" /> + <ngram occurrences="21" value="_e" /> + <ngram occurrences="20" value="ta" /> + <ngram occurrences="20" value="av" /> + <ngram occurrences="20" value="a_p" /> + <ngram occurrences="20" value="_na" /> + <ngram occurrences="19" value="ol" /> + <ngram occurrences="19" value="mi" /> + <ngram occurrences="19" value="kt" /> + <ngram occurrences="19" value="ic" /> + <ngram occurrences="18" value="vy" /> + <ngram occurrences="18" value="ov_" /> + <ngram occurrences="18" value="on" /> + <ngram occurrences="18" value="om_" /> + <ngram occurrences="18" value="me" /> + <ngram occurrences="18" value="je" /> + <ngram occurrences="18" value="_ne" /> + <ngram occurrences="17" value="í_" /> + <ngram occurrences="17" value="ri" /> + <ngram occurrences="17" value="red" /> + <ngram occurrences="17" value="r_" /> + <ngram occurrences="17" value="pred" /> + <ngram occurrences="17" value="na_" /> + <ngram occurrences="17" value="g" /> + <ngram occurrences="17" value="ak" /> + <ngram occurrences="17" value="_pred" /> + <ngram occurrences="17" value="_b" /> + <ngram occurrences="16" value="oz" /> + <ngram occurrences="16" value="ma" /> + <ngram occurrences="16" value="li_" /> + <ngram occurrences="16" value="it" /> + <ngram occurrences="16" value="er" /> + <ngram occurrences="16" value="ej_" /> + <ngram occurrences="16" value="ar" /> + <ngram occurrences="16" value="_vy" /> + <ngram occurrences="15" value="sta" /> + <ngram occurrences="15" value="sl" /> + <ngram occurrences="15" value="ova_" /> + <ngram occurrences="15" value="ost" /> + <ngram occurrences="15" value="kto" /> + <ngram occurrences="15" value="in" /> + <ngram occurrences="15" value="ho_" /> + <ngram occurrences="15" value="et" /> + <ngram occurrences="15" value="at" /> + <ngram occurrences="15" value="al" /> + <ngram occurrences="15" value="a_n" /> + <ngram occurrences="14" value="ÿ" /> + <ngram occurrences="14" value="èi" /> + <ngram occurrences="14" value="tor" /> + <ngram occurrences="14" value="ne_" /> + <ngram occurrences="14" value="le" /> + <ngram occurrences="14" value="ie_" /> + <ngram occurrences="14" value="_c" /> + <ngram occurrences="13" value="ých_" /> + <ngram occurrences="13" value="ých" /> + <ngram occurrences="13" value="ýc" /> + <ngram occurrences="13" value="é_" /> + <ngram occurrences="13" value="zá" /> + <ngram occurrences="13" value="tr" /> + <ngram occurrences="13" value="mo" /> + <ngram occurrences="13" value="lo" /> + <ngram occurrences="13" value="l_" /> + <ngram occurrences="13" value="ia_" /> + <ngram occurrences="13" value="f" /> + <ngram occurrences="13" value="edo" /> + <ngram occurrences="13" value="ani" /> + <ngram occurrences="13" value="_è" /> + <ngram occurrences="13" value="_r" /> + <ngram occurrences="13" value="_kto" /> + <ngram occurrences="13" value="_kt" /> + <ngram occurrences="13" value="_j" /> + <ngram occurrences="13" value="_ak" /> + <ngram occurrences="12" value="ý_" /> + <ngram occurrences="12" value="èa" /> + <ngram occurrences="12" value="zo" /> + <ngram occurrences="12" value="tu" /> + <ngram occurrences="12" value="to_" /> + <ngram occurrences="12" value="ti_" /> + <ngram occurrences="12" value="sk" /> + <ngram occurrences="12" value="sa" /> + <ngram occurrences="12" value="ot" /> + <ngram occurrences="12" value="nos" /> + <ngram occurrences="12" value="ktor" /> + <ngram occurrences="12" value="ka" /> + <ngram occurrences="12" value="il" /> + <ngram occurrences="12" value="de_" /> + <ngram occurrences="12" value="ad" /> + <ngram occurrences="12" value="a_s" /> + <ngram occurrences="12" value="_ma" /> + <ngram occurrences="12" value="_ktor" /> + <ngram occurrences="12" value="_h" /> + <ngram occurrences="11" value="ým" /> + <ngram occurrences="11" value="ál" /> + <ngram occurrences="11" value="vl" /> + <ngram occurrences="11" value="tn" /> + <ngram occurrences="11" value="rn" /> + <ngram occurrences="11" value="os_" /> + <ngram occurrences="11" value="ok" /> + <ngram occurrences="11" value="ný" /> + <ngram occurrences="11" value="né" /> + <ngram occurrences="11" value="ná" /> + <ngram occurrences="11" value="nie" /> + <ngram occurrences="11" value="e_p" /> + <ngram occurrences="11" value="ds" /> + <ngram occurrences="11" value="di" /> + <ngram occurrences="11" value="as" /> + <ngram occurrences="11" value="a_pr" /> + <ngram occurrences="11" value="_vl" /> + <ngram occurrences="11" value="_st" /> + <ngram occurrences="11" value="_ob" /> + <ngram occurrences="10" value="ým_" /> + <ngram occurrences="10" value="ú_" /> + <ngram occurrences="10" value="á_" /> + <ngram occurrences="10" value="z_" /> + <ngram occurrences="10" value="ud" /> + <ngram occurrences="10" value="tav" /> + <ngram occurrences="10" value="stav" /> + <ngram occurrences="10" value="pro" /> + <ngram occurrences="10" value="pra" /> + <ngram occurrences="10" value="oj" /> + <ngram occurrences="10" value="kon" /> + <ngram occurrences="10" value="k_" /> + <ngram occurrences="10" value="i_p" /> + <ngram occurrences="10" value="eè" /> + <ngram occurrences="10" value="bud" /> + <ngram occurrences="10" value="bu" /> + <ngram occurrences="10" value="a_v" /> + <ngram occurrences="10" value="a_o" /> + <ngram occurrences="10" value="_ve" /> + <ngram occurrences="10" value="_u" /> + <ngram occurrences="10" value="_od" /> + <ngram occurrences="10" value="_na_" /> + <ngram occurrences="10" value="_do" /> + <ngram occurrences="10" value="_bud" /> + <ngram occurrences="10" value="_bu" /> + <ngram occurrences="9" value="èe" /> + <ngram occurrences="9" value="ác" /> + <ngram occurrences="9" value="ved" /> + <ngram occurrences="9" value="v_m" /> + <ngram occurrences="9" value="tá" /> + <ngram occurrences="9" value="t_" /> + <ngram occurrences="9" value="so" /> + <ngram occurrences="9" value="ran" /> + <ngram occurrences="9" value="pe" /> + <ngram occurrences="9" value="ou_" /> + <ngram occurrences="9" value="ou" /> + <ngram occurrences="9" value="o_v" /> + <ngram occurrences="9" value="ných_" /> + <ngram occurrences="9" value="ných" /> + <ngram occurrences="9" value="nýc" /> + <ngram occurrences="9" value="ní" /> + <ngram occurrences="9" value="ny" /> + <ngram occurrences="9" value="n_" /> + <ngram occurrences="9" value="lá" /> + <ngram occurrences="9" value="ln" /> + <ngram occurrences="9" value="ky_" /> + <ngram occurrences="9" value="ky" /> + <ngram occurrences="9" value="ko_" /> + <ngram occurrences="9" value="je_" /> + <ngram occurrences="9" value="is" /> + <ngram occurrences="9" value="ich_" /> + <ngram occurrences="9" value="ich" /> + <ngram occurrences="9" value="es" /> + <ngram occurrences="9" value="em" /> + <ngram occurrences="9" value="e_v" /> + <ngram occurrences="9" value="e_n" /> + <ngram occurrences="9" value="dom" /> + <ngram occurrences="9" value="aj_" /> + <ngram occurrences="9" value="a_d" /> + <ngram occurrences="9" value="_zá" /> + <ngram occurrences="9" value="_sa" /> + <ngram occurrences="9" value="_pro" /> + <ngram occurrences="9" value="_e_" /> + <ngram occurrences="8" value="ò" /> + <ngram occurrences="8" value="áv" /> + <ngram occurrences="8" value="át" /> + <ngram occurrences="8" value="za" /> + <ngram occurrences="8" value="u_kto" /> + <ngram occurrences="8" value="u_kt" /> + <ngram occurrences="8" value="u_k" /> + <ngram occurrences="8" value="tu_" /> + <ngram occurrences="8" value="sv" /> + <ngram occurrences="8" value="str" /> + <ngram occurrences="8" value="sa_" /> + <ngram occurrences="8" value="rá" /> + <ngram occurrences="8" value="redst" /> + <ngram occurrences="8" value="reds" /> + <ngram occurrences="8" value="preds" /> + <ngram occurrences="8" value="pos" /> + <ngram occurrences="8" value="pod" /> + <ngram occurrences="8" value="omi" /> + <ngram occurrences="8" value="né_" /> + <ngram occurrences="8" value="nov" /> + <ngram occurrences="8" value="nom" /> + <ngram occurrences="8" value="m_v" /> + <ngram occurrences="8" value="m_p" /> + <ngram occurrences="8" value="iá" /> + <ngram occurrences="8" value="iz" /> + <ngram occurrences="8" value="ili" /> + <ngram occurrences="8" value="ik" /> + <ngram occurrences="8" value="i_v" /> + <ngram occurrences="8" value="hr" /> + <ngram occurrences="8" value="eni" /> + <ngram occurrences="8" value="edsta" /> + <ngram occurrences="8" value="edst" /> + <ngram occurrences="8" value="eds" /> + <ngram occurrences="8" value="eb" /> + <ngram occurrences="8" value="e_a" /> + <ngram occurrences="8" value="dstav" /> + <ngram occurrences="8" value="dsta" /> + <ngram occurrences="8" value="dst" /> + <ngram occurrences="8" value="dn" /> + <ngram occurrences="8" value="da" /> + <ngram occurrences="8" value="ck" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="am" /> + <ngram occurrences="8" value="ako_" /> + <ngram occurrences="8" value="ako" /> + <ngram occurrences="8" value="a_po" /> + <ngram occurrences="8" value="_z_" /> + <ngram occurrences="8" value="_v_m" /> + <ngram occurrences="8" value="_pos" /> + <ngram occurrences="8" value="_me" /> + <ngram occurrences="8" value="_je" /> + <ngram occurrences="8" value="_f" /> + <ngram occurrences="8" value="_ako_" /> + <ngram occurrences="8" value="_ako" /> + <ngram occurrences="8" value="_a_o" /> + <ngram occurrences="7" value="ého" /> + <ngram occurrences="7" value="éh" /> + <ngram occurrences="7" value="èn" /> + <ngram occurrences="7" value="ä" /> + <ngram occurrences="7" value="áln" /> + <ngram occurrences="7" value="ád" /> + <ngram occurrences="7" value="vý" /> + <ngram occurrences="7" value="vu" /> + <ngram occurrences="7" value="vn" /> + <ngram occurrences="7" value="vlád" /> + <ngram occurrences="7" value="vlá" /> + <ngram occurrences="7" value="vi_" /> + <ngram occurrences="7" value="v_me" /> + <ngram occurrences="7" value="v_etk" /> + <ngram occurrences="7" value="v_et" /> + <ngram occurrences="7" value="v_e" /> + <ngram occurrences="7" value="uje" /> + <ngram occurrences="7" value="uj" /> + <ngram occurrences="7" value="ude_" /> + <ngram occurrences="7" value="ude" /> + <ngram occurrences="7" value="tk" /> + <ngram occurrences="7" value="sú" /> + <ngram occurrences="7" value="sto" /> + <ngram occurrences="7" value="sti" /> + <ngram occurrences="7" value="rov" /> + <ngram occurrences="7" value="pri" /> + <ngram occurrences="7" value="orn" /> + <ngram occurrences="7" value="op" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="nos_" /> + <ngram occurrences="7" value="nie_" /> + <ngram occurrences="7" value="m_pr" /> + <ngram occurrences="7" value="lád" /> + <ngram occurrences="7" value="ký" /> + <ngram occurrences="7" value="kr" /> + <ngram occurrences="7" value="jm" /> + <ngram occurrences="7" value="iv" /> + <ngram occurrences="7" value="ite" /> + <ngram occurrences="7" value="ga" /> + <ngram occurrences="7" value="eÿ" /> + <ngram occurrences="7" value="etk" /> + <ngram occurrences="7" value="eho_" /> + <ngram occurrences="7" value="eho" /> + <ngram occurrences="7" value="eh" /> + <ngram occurrences="7" value="e_s" /> + <ngram occurrences="7" value="bè" /> + <ngram occurrences="7" value="bude_" /> + <ngram occurrences="7" value="bude" /> + <ngram occurrences="7" value="be" /> + <ngram occurrences="7" value="avi" /> + <ngram occurrences="7" value="ate" /> + <ngram occurrences="7" value="a_a" /> + <ngram occurrences="7" value="_vlád" /> + <ngram occurrences="7" value="_vlá" /> + <ngram occurrences="7" value="_v_me" /> + <ngram occurrences="7" value="_sú" /> + <ngram occurrences="7" value="_sv" /> + <ngram occurrences="7" value="_sa_" /> + <ngram occurrences="7" value="_ro" /> + <ngram occurrences="7" value="_pri" /> + <ngram occurrences="7" value="_pod" /> + <ngram occurrences="7" value="_or" /> + <ngram occurrences="7" value="_ko" /> + <ngram occurrences="7" value="_ka" /> + <ngram occurrences="7" value="_etk" /> + <ngram occurrences="7" value="_et" /> + <ngram occurrences="7" value="_bude" /> + <ngram occurrences="7" value="_a_p" /> + <ngram occurrences="6" value="ÿov" /> + <ngram occurrences="6" value="ÿo" /> + <ngram occurrences="6" value="ÿa" /> + <ngram occurrences="6" value="úc" /> + <ngram occurrences="6" value="ís" /> + <ngram occurrences="6" value="ém" /> + <ngram occurrences="6" value="ého_" /> +</ngrams> diff --git a/src/plugins/language/slovenian.klp b/src/plugins/language/slovenian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="793" value="_" /> + <ngram occurrences="433" value="e" /> + <ngram occurrences="410" value="a" /> + <ngram occurrences="356" value="o" /> + <ngram occurrences="347" value="i" /> + <ngram occurrences="285" value="n" /> + <ngram occurrences="207" value="r" /> + <ngram occurrences="205" value="s" /> + <ngram occurrences="200" value="l" /> + <ngram occurrences="181" value="t" /> + <ngram occurrences="172" value="j" /> + <ngram occurrences="155" value="v" /> + <ngram occurrences="150" value="k" /> + <ngram occurrences="148" value="e_" /> + <ngram occurrences="141" value="d" /> + <ngram occurrences="138" value="a_" /> + <ngram occurrences="123" value="z" /> + <ngram occurrences="120" value="p" /> + <ngram occurrences="119" value="y" /> + <ngram occurrences="114" value="o_" /> + <ngram occurrences="101" value="m" /> + <ngram occurrences="100" value="i_" /> + <ngram occurrences="100" value="_s" /> + <ngram occurrences="91" value="c" /> + <ngram occurrences="82" value="_p" /> + <ngram occurrences="79" value="_n" /> + <ngram occurrences="78" value="je" /> + <ngram occurrences="71" value="cy" /> + <ngram occurrences="69" value="_v" /> + <ngram occurrences="64" value="b" /> + <ngram occurrences="61" value="u" /> + <ngram occurrences="57" value="_z" /> + <ngram occurrences="56" value="je_" /> + <ngram occurrences="55" value="na" /> + <ngram occurrences="55" value="_j" /> + <ngram occurrences="53" value="st" /> + <ngram occurrences="53" value="ra" /> + <ngram occurrences="52" value="g" /> + <ngram occurrences="50" value="ni" /> + <ngram occurrences="50" value="_je" /> + <ngram occurrences="48" value="_je_" /> + <ngram occurrences="46" value="se" /> + <ngram occurrences="46" value="al" /> + <ngram occurrences="45" value="po" /> + <ngram occurrences="45" value="in" /> + <ngram occurrences="42" value="h" /> + <ngram occurrences="42" value="el" /> + <ngram occurrences="42" value="_k" /> + <ngram occurrences="41" value="la" /> + <ngram occurrences="40" value="no" /> + <ngram occurrences="39" value="ye" /> + <ngram occurrences="39" value="n_" /> + <ngram occurrences="38" value="ti" /> + <ngram occurrences="38" value="_o" /> + <ngram occurrences="38" value="_d" /> + <ngram occurrences="37" value="re" /> + <ngram occurrences="37" value="il" /> + <ngram occurrences="36" value="ne" /> + <ngram occurrences="36" value="_t" /> + <ngram occurrences="36" value="_na" /> + <ngram occurrences="36" value="_i" /> + <ngram occurrences="35" value="ko" /> + <ngram occurrences="35" value="en" /> + <ngram occurrences="35" value="_po" /> + <ngram occurrences="34" value="ve" /> + <ngram occurrences="34" value="v_" /> + <ngram occurrences="34" value="pr" /> + <ngram occurrences="34" value="ja" /> + <ngram occurrences="34" value="de" /> + <ngram occurrences="33" value="va" /> + <ngram occurrences="33" value="lo" /> + <ngram occurrences="32" value="l_" /> + <ngram occurrences="32" value="_m" /> + <ngram occurrences="31" value="ka" /> + <ngram occurrences="30" value="za" /> + <ngram occurrences="30" value="ov" /> + <ngram occurrences="30" value="li" /> + <ngram occurrences="30" value="le" /> + <ngram occurrences="30" value="_b" /> + <ngram occurrences="29" value="zy" /> + <ngram occurrences="29" value="te" /> + <ngram occurrences="29" value="ri" /> + <ngram occurrences="29" value="nj" /> + <ngram occurrences="29" value="_se" /> + <ngram occurrences="28" value="an" /> + <ngram occurrences="28" value="aj" /> + <ngram occurrences="27" value="od" /> + <ngram occurrences="27" value="et" /> + <ngram occurrences="27" value="da" /> + <ngram occurrences="26" value="to" /> + <ngram occurrences="26" value="h_" /> + <ngram occurrences="26" value="_pr" /> + <ngram occurrences="25" value="ro" /> + <ngram occurrences="25" value="ek" /> + <ngram occurrences="25" value="_za" /> + <ngram occurrences="24" value="ih" /> + <ngram occurrences="24" value="ed" /> + <ngram occurrences="23" value="yi" /> + <ngram occurrences="23" value="se_" /> + <ngram occurrences="23" value="m_" /> + <ngram occurrences="23" value="_v_" /> + <ngram occurrences="23" value="_r" /> + <ngram occurrences="22" value="u_" /> + <ngram occurrences="22" value="oc" /> + <ngram occurrences="22" value="na_" /> + <ngram occurrences="22" value="la_" /> + <ngram occurrences="22" value="ih_" /> + <ngram occurrences="22" value="ad" /> + <ngram occurrences="22" value="_se_" /> + <ngram occurrences="21" value="so" /> + <ngram occurrences="21" value="r_" /> + <ngram occurrences="21" value="ocy" /> + <ngram occurrences="21" value="no_" /> + <ngram occurrences="21" value="lo_" /> + <ngram occurrences="21" value="em" /> + <ngram occurrences="21" value="_ne" /> + <ngram occurrences="20" value="tr" /> + <ngram occurrences="20" value="t_" /> + <ngram occurrences="20" value="ob" /> + <ngram occurrences="20" value="ji" /> + <ngram occurrences="20" value="iz" /> + <ngram occurrences="20" value="ar" /> + <ngram occurrences="19" value="ya" /> + <ngram occurrences="19" value="sy" /> + <ngram occurrences="19" value="o_s" /> + <ngram occurrences="19" value="mi" /> + <ngram occurrences="19" value="ki" /> + <ngram occurrences="19" value="in_" /> + <ngram occurrences="19" value="ic" /> + <ngram occurrences="19" value="i_s" /> + <ngram occurrences="19" value="es" /> + <ngram occurrences="19" value="_ve" /> + <ngram occurrences="19" value="_so" /> + <ngram occurrences="19" value="_in_" /> + <ngram occurrences="19" value="_in" /> + <ngram occurrences="18" value="z_" /> + <ngram occurrences="18" value="ta" /> + <ngram occurrences="18" value="os" /> + <ngram occurrences="18" value="mo" /> + <ngram occurrences="18" value="ja_" /> + <ngram occurrences="18" value="ik" /> + <ngram occurrences="18" value="er" /> + <ngram occurrences="18" value="e_n" /> + <ngram occurrences="18" value="cye" /> + <ngram occurrences="18" value="ak" /> + <ngram occurrences="17" value="ye_" /> + <ngram occurrences="17" value="lj" /> + <ngram occurrences="17" value="is" /> + <ngram occurrences="17" value="ga" /> + <ngram occurrences="17" value="bi" /> + <ngram occurrences="17" value="az" /> + <ngram occurrences="17" value="as" /> + <ngram occurrences="17" value="a_s" /> + <ngram occurrences="16" value="ti_" /> + <ngram occurrences="16" value="so_" /> + <ngram occurrences="16" value="pre" /> + <ngram occurrences="16" value="pa" /> + <ngram occurrences="16" value="on" /> + <ngram occurrences="16" value="ol" /> + <ngram occurrences="16" value="og" /> + <ngram occurrences="16" value="o_n" /> + <ngram occurrences="16" value="ns" /> + <ngram occurrences="16" value="ne_" /> + <ngram occurrences="16" value="kr" /> + <ngram occurrences="16" value="ec" /> + <ngram occurrences="16" value="e_p" /> + <ngram occurrences="16" value="at" /> + <ngram occurrences="16" value="a_p" /> + <ngram occurrences="16" value="_c" /> + <ngram occurrences="15" value="zye" /> + <ngram occurrences="15" value="vo" /> + <ngram occurrences="15" value="sa" /> + <ngram occurrences="15" value="ot" /> + <ngram occurrences="15" value="or" /> + <ngram occurrences="15" value="om" /> + <ngram occurrences="15" value="j_" /> + <ngram occurrences="15" value="im" /> + <ngram occurrences="15" value="go" /> + <ngram occurrences="15" value="e_z" /> + <ngram occurrences="15" value="e_s" /> + <ngram occurrences="15" value="_so_" /> + <ngram occurrences="15" value="_iz" /> + <ngram occurrences="15" value="_g" /> + <ngram occurrences="15" value="_bi" /> + <ngram occurrences="14" value="yn" /> + <ngram occurrences="14" value="nje" /> + <ngram occurrences="14" value="li_" /> + <ngram occurrences="14" value="ko_" /> + <ngram occurrences="14" value="k_" /> + <ngram occurrences="14" value="ecy" /> + <ngram occurrences="14" value="dn" /> + <ngram occurrences="14" value="di" /> + <ngram occurrences="14" value="da_" /> + <ngram occurrences="14" value="cyi" /> + <ngram occurrences="14" value="av" /> + <ngram occurrences="14" value="_pre" /> + <ngram occurrences="14" value="_ko" /> + <ngram occurrences="13" value="raz" /> + <ngram occurrences="13" value="me" /> + <ngram occurrences="13" value="ke" /> + <ngram occurrences="13" value="ir" /> + <ngram occurrences="13" value="ins" /> + <ngram occurrences="13" value="ga_" /> + <ngram occurrences="13" value="em_" /> + <ngram occurrences="13" value="e_j" /> + <ngram occurrences="13" value="do" /> + <ngram occurrences="13" value="br" /> + <ngram occurrences="13" value="ap" /> + <ngram occurrences="13" value="a_v" /> + <ngram occurrences="13" value="_na_" /> + <ngram occurrences="13" value="_da" /> + <ngram occurrences="12" value="sto" /> + <ngram occurrences="12" value="ova" /> + <ngram occurrences="12" value="ok" /> + <ngram occurrences="12" value="ni_" /> + <ngram occurrences="12" value="ez" /> + <ngram occurrences="12" value="eg" /> + <ngram occurrences="12" value="cya" /> + <ngram occurrences="12" value="bil" /> + <ngram occurrences="12" value="al_" /> + <ngram occurrences="12" value="a_k" /> + <ngram occurrences="12" value="_st" /> + <ngram occurrences="12" value="_ni" /> + <ngram occurrences="12" value="_cy" /> + <ngram occurrences="12" value="_bil" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="sk" /> + <ngram occurrences="11" value="ost" /> + <ngram occurrences="11" value="nst" /> + <ngram occurrences="11" value="le_" /> + <ngram occurrences="11" value="jo" /> + <ngram occurrences="11" value="ilo_" /> + <ngram occurrences="11" value="ilo" /> + <ngram occurrences="11" value="ij" /> + <ngram occurrences="11" value="ev" /> + <ngram occurrences="11" value="elo" /> + <ngram occurrences="11" value="e_v" /> + <ngram occurrences="11" value="e_b" /> + <ngram occurrences="11" value="del" /> + <ngram occurrences="11" value="cyn" /> + <ngram occurrences="11" value="ala" /> + <ngram occurrences="11" value="aj_" /> + <ngram occurrences="11" value="a_n" /> + <ngram occurrences="11" value="_zy" /> + <ngram occurrences="11" value="_ra" /> + <ngram occurrences="11" value="_pa" /> + <ngram occurrences="11" value="_mo" /> + <ngram occurrences="11" value="_l" /> + <ngram occurrences="11" value="_do" /> + <ngram occurrences="10" value="yal" /> + <ngram occurrences="10" value="y_" /> + <ngram occurrences="10" value="winst" /> + <ngram occurrences="10" value="wins" /> + <ngram occurrences="10" value="win" /> + <ngram occurrences="10" value="wi" /> + <ngram occurrences="10" value="w" /> + <ngram occurrences="10" value="un" /> + <ngram occurrences="10" value="ton" /> + <ngram occurrences="10" value="to_" /> + <ngram occurrences="10" value="ston" /> + <ngram occurrences="10" value="rat" /> + <ngram occurrences="10" value="o_b" /> + <ngram occurrences="10" value="nston" /> + <ngram occurrences="10" value="nsto" /> + <ngram occurrences="10" value="mi_" /> + <ngram occurrences="10" value="ln" /> + <ngram occurrences="10" value="ka_" /> + <ngram occurrences="10" value="ji_" /> + <ngram occurrences="10" value="insto" /> + <ngram occurrences="10" value="inst" /> + <ngram occurrences="10" value="i_p" /> + <ngram occurrences="10" value="eti" /> + <ngram occurrences="10" value="e_m" /> + <ngram occurrences="10" value="e_je" /> + <ngram occurrences="10" value="d_" /> + <ngram occurrences="10" value="cye_" /> + <ngram occurrences="10" value="ce" /> + <ngram occurrences="10" value="anj" /> + <ngram occurrences="10" value="ali_" /> + <ngram occurrences="10" value="ali" /> + <ngram occurrences="10" value="ala_" /> + <ngram occurrences="10" value="ac" /> + <ngram occurrences="10" value="a_je_" /> + <ngram occurrences="10" value="a_je" /> + <ngram occurrences="10" value="a_j" /> + <ngram occurrences="10" value="a_d" /> + <ngram occurrences="10" value="_wins" /> + <ngram occurrences="10" value="_win" /> + <ngram occurrences="10" value="_wi" /> + <ngram occurrences="10" value="_w" /> + <ngram occurrences="10" value="_te" /> + <ngram occurrences="10" value="_od" /> + <ngram occurrences="10" value="_ob" /> + <ngram occurrences="9" value="za_" /> + <ngram occurrences="9" value="se_j" /> + <ngram occurrences="9" value="rj" /> + <ngram occurrences="9" value="po_" /> + <ngram occurrences="9" value="pi" /> + <ngram occurrences="9" value="pe" /> + <ngram occurrences="9" value="oz" /> + <ngram occurrences="9" value="ov_" /> + <ngram occurrences="9" value="o_p" /> + <ngram occurrences="9" value="nu" /> + <ngram occurrences="9" value="nic" /> + <ngram occurrences="9" value="kra" /> + <ngram occurrences="9" value="ki_" /> + <ngram occurrences="9" value="je_n" /> + <ngram occurrences="9" value="it" /> + <ngram occurrences="9" value="il_" /> + <ngram occurrences="9" value="icy" /> + <ngram occurrences="9" value="i_v" /> + <ngram occurrences="9" value="i_n" /> + <ngram occurrences="9" value="er_" /> + <ngram occurrences="9" value="elo_" /> + <ngram occurrences="9" value="e_r" /> + <ngram occurrences="9" value="e_na" /> + <ngram occurrences="9" value="e_je_" /> + <ngram occurrences="9" value="am" /> + <ngram occurrences="9" value="acy" /> + <ngram occurrences="9" value="a_po" /> + <ngram occurrences="9" value="_se_j" /> + <ngram occurrences="9" value="_po_" /> + <ngram occurrences="9" value="_ka" /> + <ngram occurrences="9" value="_da_" /> + <ngram occurrences="8" value="ze" /> + <ngram occurrences="8" value="yil" /> + <ngram occurrences="8" value="vr" /> + <ngram occurrences="8" value="val" /> + <ngram occurrences="8" value="tv" /> + <ngram occurrences="8" value="stv" /> + <ngram occurrences="8" value="ran" /> + <ngram occurrences="8" value="o_na" /> + <ngram occurrences="8" value="n_s" /> + <ngram occurrences="8" value="ma" /> + <ngram occurrences="8" value="kl" /> + <ngram occurrences="8" value="jen" /> + <ngram occurrences="8" value="ist" /> + <ngram occurrences="8" value="imi_" /> + <ngram occurrences="8" value="imi" /> + <ngram occurrences="8" value="i_j" /> + <ngram occurrences="8" value="ezy" /> + <ngram occurrences="8" value="ese" /> + <ngram occurrences="8" value="en_" /> + <ngram occurrences="8" value="eli" /> + <ngram occurrences="8" value="el_" /> + <ngram occurrences="8" value="e_pr" /> + <ngram occurrences="8" value="cy_" /> + <ngram occurrences="8" value="bo" /> + <ngram occurrences="8" value="ah" /> + <ngram occurrences="8" value="a_z" /> + <ngram occurrences="8" value="a_o" /> + <ngram occurrences="8" value="_zye" /> + <ngram occurrences="8" value="_re" /> + <ngram occurrences="8" value="_nj" /> + <ngram occurrences="8" value="_mi" /> + <ngram occurrences="8" value="_kr" /> + <ngram occurrences="8" value="_de" /> + <ngram occurrences="8" value="_br" /> + <ngram occurrences="8" value="_a" /> + <ngram occurrences="7" value="yno_" /> + <ngram occurrences="7" value="yno" /> + <ngram occurrences="7" value="var" /> + <ngram occurrences="7" value="ton_" /> + <ngram occurrences="7" value="tem" /> + <ngram occurrences="7" value="tak" /> + <ngram occurrences="7" value="str" /> + <ngram occurrences="7" value="ston_" /> + <ngram occurrences="7" value="sti" /> + <ngram occurrences="7" value="ste" /> + <ngram occurrences="7" value="sp" /> + <ngram occurrences="7" value="set" /> + <ngram occurrences="7" value="sed" /> + <ngram occurrences="7" value="pri" /> + <ngram occurrences="7" value="pol" /> + <ngram occurrences="7" value="pa_" /> + <ngram occurrences="7" value="on_" /> + <ngram occurrences="7" value="o_t" /> + <ngram occurrences="7" value="o_se" /> + <ngram occurrences="7" value="o_d" /> + <ngram occurrences="7" value="nov" /> + <ngram occurrences="7" value="nost" /> + <ngram occurrences="7" value="nos" /> + <ngram occurrences="7" value="nih_" /> + <ngram occurrences="7" value="nih" /> + <ngram occurrences="7" value="na_s" /> + <ngram occurrences="7" value="lik" /> + <ngram occurrences="7" value="kih_" /> + <ngram occurrences="7" value="kih" /> + <ngram occurrences="7" value="ke_" /> + <ngram occurrences="7" value="ju" /> + <ngram occurrences="7" value="je_s" /> + <ngram occurrences="7" value="je_p" /> + <ngram occurrences="7" value="je_bi" /> + <ngram occurrences="7" value="je_b" /> + <ngram occurrences="7" value="iz_" /> + <ngram occurrences="7" value="i_z" /> + <ngram occurrences="7" value="i_m" /> + <ngram occurrences="7" value="gl" /> + <ngram occurrences="7" value="et_" /> + <ngram occurrences="7" value="elik" /> +</ngrams> diff --git a/src/plugins/language/slovenian2.klp b/src/plugins/language/slovenian2.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="662" value="_" /> + <ngram occurrences="375" value="a" /> + <ngram occurrences="335" value="o" /> + <ngram occurrences="311" value="e" /> + <ngram occurrences="269" value="n" /> + <ngram occurrences="248" value="i" /> + <ngram occurrences="201" value="r" /> + <ngram occurrences="190" value="v" /> + <ngram occurrences="179" value="s" /> + <ngram occurrences="169" value="t" /> + <ngram occurrences="152" value="k" /> + <ngram occurrences="151" value="l" /> + <ngram occurrences="148" value="c" /> + <ngram occurrences="143" value="p" /> + <ngram occurrences="138" value="u" /> + <ngram occurrences="137" value="d" /> + <ngram occurrences="112" value="a_" /> + <ngram occurrences="108" value="y" /> + <ngram occurrences="96" value="m" /> + <ngram occurrences="92" value="h" /> + <ngram occurrences="83" value="e_" /> + <ngram occurrences="81" value="z" /> + <ngram occurrences="80" value="_p" /> + <ngram occurrences="79" value="na" /> + <ngram occurrences="69" value="_v" /> + <ngram occurrences="65" value="j" /> + <ngram occurrences="65" value="_s" /> + <ngram occurrences="61" value="ov" /> + <ngram occurrences="60" value="po" /> + <ngram occurrences="58" value="_n" /> + <ngram occurrences="57" value="i_" /> + <ngram occurrences="55" value="v_" /> + <ngram occurrences="53" value="u_" /> + <ngram occurrences="53" value="ro" /> + <ngram occurrences="53" value="b" /> + <ngram occurrences="51" value="o_" /> + <ngram occurrences="47" value="_na" /> + <ngram occurrences="46" value="ch" /> + <ngram occurrences="45" value="y_" /> + <ngram occurrences="43" value="ne" /> + <ngram occurrences="43" value="_a" /> + <ngram occurrences="41" value="en" /> + <ngram occurrences="41" value="_z" /> + <ngram occurrences="40" value="re" /> + <ngram occurrences="39" value="st" /> + <ngram occurrences="39" value="h_" /> + <ngram occurrences="38" value="la" /> + <ngram occurrences="38" value="an" /> + <ngram occurrences="37" value="_po" /> + <ngram occurrences="35" value="pr" /> + <ngram occurrences="34" value="ch_" /> + <ngram occurrences="34" value="_t" /> + <ngram occurrences="33" value="vy" /> + <ngram occurrences="32" value="ci" /> + <ngram occurrences="32" value="_v_" /> + <ngram occurrences="32" value="_o" /> + <ngram occurrences="31" value="od" /> + <ngram occurrences="31" value="na_" /> + <ngram occurrences="31" value="ie" /> + <ngram occurrences="31" value="_pr" /> + <ngram occurrences="30" value="ko" /> + <ngram occurrences="30" value="_m" /> + <ngram occurrences="29" value="sk" /> + <ngram occurrences="29" value="_k" /> + <ngram occurrences="28" value="ti" /> + <ngram occurrences="28" value="er" /> + <ngram occurrences="27" value="ve" /> + <ngram occurrences="27" value="al" /> + <ngram occurrences="27" value="_r" /> + <ngram occurrences="26" value="ra" /> + <ngram occurrences="26" value="or" /> + <ngram occurrences="26" value="ni" /> + <ngram occurrences="26" value="in" /> + <ngram occurrences="26" value="ed" /> + <ngram occurrences="25" value="yc" /> + <ngram occurrences="25" value="va" /> + <ngram occurrences="25" value="ny" /> + <ngram occurrences="25" value="mi" /> + <ngram occurrences="25" value="ak" /> + <ngram occurrences="24" value="ych" /> + <ngram occurrences="24" value="to" /> + <ngram occurrences="24" value="le" /> + <ngram occurrences="24" value="ho" /> + <ngram occurrences="24" value="ce" /> + <ngram occurrences="24" value="ad" /> + <ngram occurrences="24" value="ac" /> + <ngram occurrences="24" value="_na_" /> + <ngram occurrences="24" value="_d" /> + <ngram occurrences="23" value="tr" /> + <ngram occurrences="23" value="t_" /> + <ngram occurrences="23" value="si" /> + <ngram occurrences="23" value="ov_" /> + <ngram occurrences="23" value="ka" /> + <ngram occurrences="23" value="_c" /> + <ngram occurrences="22" value="ych_" /> + <ngram occurrences="22" value="no" /> + <ngram occurrences="22" value="li" /> + <ngram occurrences="22" value="il" /> + <ngram occurrences="22" value="_u" /> + <ngram occurrences="21" value="te" /> + <ngram occurrences="21" value="sa" /> + <ngram occurrences="21" value="ok" /> + <ngram occurrences="20" value="os" /> + <ngram occurrences="20" value="om" /> + <ngram occurrences="20" value="it" /> + <ngram occurrences="20" value="do" /> + <ngram occurrences="19" value="za" /> + <ngram occurrences="19" value="ta" /> + <ngram occurrences="19" value="me" /> + <ngram occurrences="19" value="l_" /> + <ngram occurrences="19" value="ku" /> + <ngram occurrences="19" value="ia" /> + <ngram occurrences="19" value="da" /> + <ngram occurrences="19" value="_b" /> + <ngram occurrences="18" value="pre" /> + <ngram occurrences="18" value="m_" /> + <ngram occurrences="18" value="es" /> + <ngram occurrences="18" value="a_p" /> + <ngram occurrences="18" value="_a_" /> + <ngram occurrences="17" value="oc" /> + <ngram occurrences="17" value="ej" /> + <ngram occurrences="17" value="aj" /> + <ngram occurrences="17" value="_sa" /> + <ngram occurrences="17" value="_pre" /> + <ngram occurrences="16" value="ur" /> + <ngram occurrences="16" value="r_" /> + <ngram occurrences="16" value="on" /> + <ngram occurrences="16" value="ol" /> + <ngram occurrences="16" value="lo" /> + <ngram occurrences="16" value="ky" /> + <ngram occurrences="16" value="j_" /> + <ngram occurrences="16" value="el" /> + <ngram occurrences="16" value="at" /> + <ngram occurrences="16" value="ap" /> + <ngram occurrences="16" value="_za" /> + <ngram occurrences="16" value="_vy" /> + <ngram occurrences="15" value="vo" /> + <ngram occurrences="15" value="sa_" /> + <ngram occurrences="15" value="rok" /> + <ngram occurrences="15" value="ri" /> + <ngram occurrences="15" value="ne_" /> + <ngram occurrences="15" value="ic" /> + <ngram occurrences="15" value="f" /> + <ngram occurrences="15" value="av" /> + <ngram occurrences="15" value="as" /> + <ngram occurrences="15" value="_ro" /> + <ngram occurrences="15" value="_j" /> + <ngram occurrences="14" value="zi" /> + <ngram occurrences="14" value="ob" /> + <ngram occurrences="14" value="nych_" /> + <ngram occurrences="14" value="nych" /> + <ngram occurrences="14" value="nyc" /> + <ngram occurrences="14" value="ke" /> + <ngram occurrences="14" value="k_" /> + <ngram occurrences="14" value="eh" /> + <ngram occurrences="14" value="d_" /> + <ngram occurrences="14" value="_sa_" /> + <ngram occurrences="13" value="v_p" /> + <ngram occurrences="13" value="us" /> + <ngram occurrences="13" value="pod" /> + <ngram occurrences="13" value="ot" /> + <ngram occurrences="13" value="nu" /> + <ngram occurrences="13" value="ln" /> + <ngram occurrences="13" value="ie_" /> + <ngram occurrences="13" value="ho_" /> + <ngram occurrences="13" value="eho_" /> + <ngram occurrences="13" value="eho" /> + <ngram occurrences="13" value="e_v" /> + <ngram occurrences="13" value="dn" /> + <ngram occurrences="13" value="di" /> + <ngram occurrences="13" value="de" /> + <ngram occurrences="13" value="co" /> + <ngram occurrences="13" value="am" /> + <ngram occurrences="13" value="a_v" /> + <ngram occurrences="13" value="_do" /> + <ngram occurrences="12" value="sp" /> + <ngram occurrences="12" value="rov" /> + <ngram occurrences="12" value="pa" /> + <ngram occurrences="12" value="nt" /> + <ngram occurrences="12" value="n_" /> + <ngram occurrences="12" value="li_" /> + <ngram occurrences="12" value="g" /> + <ngram occurrences="12" value="ar" /> + <ngram occurrences="12" value="a_n" /> + <ngram occurrences="12" value="_ak" /> + <ngram occurrences="11" value="zn" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="om_" /> + <ngram occurrences="11" value="ny_" /> + <ngram occurrences="11" value="la_" /> + <ngram occurrences="11" value="ky_" /> + <ngram occurrences="11" value="kt" /> + <ngram occurrences="11" value="em" /> + <ngram occurrences="11" value="ej_" /> + <ngram occurrences="11" value="e_p" /> + <ngram occurrences="11" value="e_n" /> + <ngram occurrences="11" value="az" /> + <ngram occurrences="11" value="a_s" /> + <ngram occurrences="11" value="_tr" /> + <ngram occurrences="11" value="_pod" /> + <ngram occurrences="11" value="_h" /> + <ngram occurrences="11" value="_ce" /> + <ngram occurrences="10" value="zv" /> + <ngram occurrences="10" value="z_" /> + <ngram occurrences="10" value="pe" /> + <ngram occurrences="10" value="oz" /> + <ngram occurrences="10" value="ovy" /> + <ngram occurrences="10" value="ove" /> + <ngram occurrences="10" value="ova" /> + <ngram occurrences="10" value="nc" /> + <ngram occurrences="10" value="nan" /> + <ngram occurrences="10" value="ka_" /> + <ngram occurrences="10" value="ju" /> + <ngram occurrences="10" value="ik" /> + <ngram occurrences="10" value="ek" /> + <ngram occurrences="10" value="du" /> + <ngram occurrences="10" value="cen" /> + <ngram occurrences="10" value="ast" /> + <ngram occurrences="10" value="a_po" /> + <ngram occurrences="10" value="a_na" /> + <ngram occurrences="10" value="_ob" /> + <ngram occurrences="10" value="_l" /> + <ngram occurrences="10" value="_i" /> + <ngram occurrences="10" value="_e" /> + <ngram occurrences="9" value="uro" /> + <ngram occurrences="9" value="tor" /> + <ngram occurrences="9" value="ti_" /> + <ngram occurrences="9" value="ska" /> + <ngram occurrences="9" value="ru" /> + <ngram occurrences="9" value="pri" /> + <ngram occurrences="9" value="pl" /> + <ngram occurrences="9" value="nu_" /> + <ngram occurrences="9" value="mo" /> + <ngram occurrences="9" value="lad" /> + <ngram occurrences="9" value="ku_" /> + <ngram occurrences="9" value="kov" /> + <ngram occurrences="9" value="kl" /> + <ngram occurrences="9" value="je" /> + <ngram occurrences="9" value="ja" /> + <ngram occurrences="9" value="iv" /> + <ngram occurrences="9" value="i_s" /> + <ngram occurrences="9" value="cov" /> + <ngram occurrences="9" value="_v_p" /> + <ngram occurrences="9" value="_ne" /> + <ngram occurrences="9" value="_mi" /> + <ngram occurrences="8" value="ze" /> + <ngram occurrences="8" value="ys" /> + <ngram occurrences="8" value="vys" /> + <ngram occurrences="8" value="vn" /> + <ngram occurrences="8" value="uc" /> + <ngram occurrences="8" value="tu" /> + <ngram occurrences="8" value="trh" /> + <ngram occurrences="8" value="su" /> + <ngram occurrences="8" value="st_" /> + <ngram occurrences="8" value="sl" /> + <ngram occurrences="8" value="ske" /> + <ngram occurrences="8" value="rh" /> + <ngram occurrences="8" value="red" /> + <ngram occurrences="8" value="pred" /> + <ngram occurrences="8" value="nej" /> + <ngram occurrences="8" value="mi_" /> + <ngram occurrences="8" value="ina" /> + <ngram occurrences="8" value="il_" /> + <ngram occurrences="8" value="ia_" /> + <ngram occurrences="8" value="et" /> + <ngram occurrences="8" value="est" /> + <ngram occurrences="8" value="er_" /> + <ngram occurrences="8" value="ent" /> + <ngram occurrences="8" value="en_" /> + <ngram occurrences="8" value="e_s" /> + <ngram occurrences="8" value="ca" /> + <ngram occurrences="8" value="ani" /> + <ngram occurrences="8" value="a_t" /> + <ngram occurrences="8" value="_zv" /> + <ngram occurrences="8" value="_ur" /> + <ngram occurrences="8" value="_trh" /> + <ngram occurrences="8" value="_st" /> + <ngram occurrences="8" value="_sp" /> + <ngram occurrences="8" value="_rok" /> + <ngram occurrences="8" value="_pri" /> + <ngram occurrences="8" value="_pred" /> + <ngram occurrences="8" value="_me" /> + <ngram occurrences="7" value="van" /> + <ngram occurrences="7" value="v_o" /> + <ngram occurrences="7" value="usd_" /> + <ngram occurrences="7" value="usd" /> + <ngram occurrences="7" value="up" /> + <ngram occurrences="7" value="uj" /> + <ngram occurrences="7" value="ud" /> + <ngram occurrences="7" value="u_a" /> + <ngram occurrences="7" value="to_" /> + <ngram occurrences="7" value="te_" /> + <ngram occurrences="7" value="sti" /> + <ngram occurrences="7" value="sta" /> + <ngram occurrences="7" value="spo" /> + <ngram occurrences="7" value="sil" /> + <ngram occurrences="7" value="sd_" /> + <ngram occurrences="7" value="sd" /> + <ngram occurrences="7" value="ost" /> + <ngram occurrences="7" value="oro" /> + <ngram occurrences="7" value="o_v" /> + <ngram occurrences="7" value="ns" /> + <ngram occurrences="7" value="nej_" /> + <ngram occurrences="7" value="neho_" /> + <ngram occurrences="7" value="neho" /> + <ngram occurrences="7" value="neh" /> + <ngram occurrences="7" value="naj" /> + <ngram occurrences="7" value="na_t" /> + <ngram occurrences="7" value="kci" /> + <ngram occurrences="7" value="kc" /> + <ngram occurrences="7" value="je_" /> + <ngram occurrences="7" value="is" /> + <ngram occurrences="7" value="hod" /> + <ngram occurrences="7" value="ep" /> + <ngram occurrences="7" value="eni" /> + <ngram occurrences="7" value="ec" /> + <ngram occurrences="7" value="du_" /> + <ngram occurrences="7" value="br" /> + <ngram occurrences="7" value="ati" /> + <ngram occurrences="7" value="ali" /> + <ngram occurrences="7" value="akci" /> + <ngram occurrences="7" value="akc" /> + <ngram occurrences="7" value="a_u" /> + <ngram occurrences="7" value="_usd_" /> + <ngram occurrences="7" value="_usd" /> + <ngram occurrences="7" value="_us" /> + <ngram occurrences="7" value="_uro" /> + <ngram occurrences="7" value="_su" /> + <ngram occurrences="7" value="_sk" /> + <ngram occurrences="7" value="_naj" /> + <ngram occurrences="7" value="_na_t" /> + <ngram occurrences="7" value="_in" /> + <ngram occurrences="7" value="_f" /> + <ngram occurrences="7" value="_cen" /> + <ngram occurrences="7" value="_akci" /> + <ngram occurrences="7" value="_akc" /> + <ngram occurrences="6" value="zac" /> + <ngram occurrences="6" value="y_p" /> + <ngram occurrences="6" value="y_a" /> + <ngram occurrences="6" value="vl" /> + <ngram occurrences="6" value="v_po" /> + <ngram occurrences="6" value="uk" /> + <ngram occurrences="6" value="u_p" /> + <ngram occurrences="6" value="u_n" /> + <ngram occurrences="6" value="u_a_" /> + <ngram occurrences="6" value="ty" /> + <ngram occurrences="6" value="tre" /> + <ngram occurrences="6" value="tn" /> + <ngram occurrences="6" value="tiv" /> + <ngram occurrences="6" value="sti_" /> + <ngram occurrences="6" value="ska_" /> + <ngram occurrences="6" value="sia" /> + <ngram occurrences="6" value="se" /> + <ngram occurrences="6" value="s_" /> + <ngram occurrences="6" value="roku_" /> + <ngram occurrences="6" value="roku" /> + <ngram occurrences="6" value="rod" /> + <ngram occurrences="6" value="ri_" /> + <ngram occurrences="6" value="re_" /> + <ngram occurrences="6" value="pos" /> + <ngram occurrences="6" value="por" /> + <ngram occurrences="6" value="otr" /> + <ngram occurrences="6" value="osl" /> + <ngram occurrences="6" value="ore" /> + <ngram occurrences="6" value="oku_" /> + <ngram occurrences="6" value="oku" /> + <ngram occurrences="6" value="odn" /> + <ngram occurrences="6" value="o_z" /> + <ngram occurrences="6" value="o_s" /> + <ngram occurrences="6" value="nsk" /> + <ngram occurrences="6" value="nov" /> + <ngram occurrences="6" value="ni_" /> + <ngram occurrences="6" value="mu" /> + <ngram occurrences="6" value="mie" /> + <ngram occurrences="6" value="ly" /> + <ngram occurrences="6" value="kon" /> + <ngram occurrences="6" value="ke_" /> + <ngram occurrences="6" value="iny_" /> + <ngram occurrences="6" value="iny" /> + <ngram occurrences="6" value="ii_" /> + <ngram occurrences="6" value="ii" /> + <ngram occurrences="6" value="id" /> + <ngram occurrences="6" value="i_v" /> + <ngram occurrences="6" value="i_n" /> + <ngram occurrences="6" value="hr" /> + <ngram occurrences="6" value="he" /> + <ngram occurrences="6" value="ele" /> + <ngram occurrences="6" value="eb" /> + <ngram occurrences="6" value="e_v_" /> + <ngram occurrences="6" value="e_po" /> + <ngram occurrences="6" value="e_na" /> + <ngram occurrences="6" value="e_m" /> + <ngram occurrences="6" value="cov_" /> + <ngram occurrences="6" value="cii_" /> + <ngram occurrences="6" value="cii" /> + <ngram occurrences="6" value="cie" /> + <ngram occurrences="6" value="cho" /> + <ngram occurrences="6" value="by" /> + <ngram occurrences="6" value="ast_" /> + <ngram occurrences="6" value="alo" /> +</ngrams> diff --git a/src/plugins/language/spanish.klp b/src/plugins/language/spanish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="820" value="_" /> + <ngram occurrences="523" value="e" /> + <ngram occurrences="495" value="a" /> + <ngram occurrences="330" value="o" /> + <ngram occurrences="292" value="s" /> + <ngram occurrences="281" value="n" /> + <ngram occurrences="273" value="r" /> + <ngram occurrences="270" value="i" /> + <ngram occurrences="243" value="l" /> + <ngram occurrences="228" value="d" /> + <ngram occurrences="198" value="c" /> + <ngram occurrences="181" value="t" /> + <ngram occurrences="171" value="e_" /> + <ngram occurrences="168" value="a_" /> + <ngram occurrences="151" value="s_" /> + <ngram occurrences="150" value="u" /> + <ngram occurrences="125" value="m" /> + <ngram occurrences="121" value="de" /> + <ngram occurrences="118" value="p" /> + <ngram occurrences="115" value="_d" /> + <ngram occurrences="105" value="_de" /> + <ngram occurrences="97" value="o_" /> + <ngram occurrences="97" value="_l" /> + <ngram occurrences="89" value="la" /> + <ngram occurrences="86" value="de_" /> + <ngram occurrences="85" value="en" /> + <ngram occurrences="83" value="_de_" /> + <ngram occurrences="81" value="es" /> + <ngram occurrences="79" value="_p" /> + <ngram occurrences="78" value="n_" /> + <ngram occurrences="73" value="_e" /> + <ngram occurrences="70" value="_c" /> + <ngram occurrences="62" value="as" /> + <ngram occurrences="62" value="_la" /> + <ngram occurrences="61" value="os" /> + <ngram occurrences="59" value="ci" /> + <ngram occurrences="56" value="os_" /> + <ngram occurrences="52" value="or" /> + <ngram occurrences="52" value="ar" /> + <ngram occurrences="51" value="ra" /> + <ngram occurrences="51" value="_a" /> + <ngram occurrences="50" value="la_" /> + <ngram occurrences="50" value="er" /> + <ngram occurrences="49" value="r_" /> + <ngram occurrences="49" value="f" /> + <ngram occurrences="48" value="ue" /> + <ngram occurrences="48" value="nt" /> + <ngram occurrences="47" value="_la_" /> + <ngram occurrences="46" value="as_" /> + <ngram occurrences="45" value="te" /> + <ngram occurrences="45" value="an" /> + <ngram occurrences="44" value="_m" /> + <ngram occurrences="42" value="l_" /> + <ngram occurrences="42" value="do" /> + <ngram occurrences="41" value="st" /> + <ngram occurrences="41" value="re" /> + <ngram occurrences="41" value="_s" /> + <ngram occurrences="40" value="ta" /> + <ngram occurrences="40" value="es_" /> + <ngram occurrences="39" value="el" /> + <ngram occurrences="38" value="ad" /> + <ngram occurrences="37" value="v" /> + <ngram occurrences="37" value="on" /> + <ngram occurrences="37" value="b" /> + <ngram occurrences="36" value="y" /> + <ngram occurrences="36" value="po" /> + <ngram occurrences="36" value="g" /> + <ngram occurrences="36" value="e_l" /> + <ngram occurrences="36" value="co" /> + <ngram occurrences="36" value="ca" /> + <ngram occurrences="36" value="al" /> + <ngram occurrences="35" value="to" /> + <ngram occurrences="35" value="lo" /> + <ngram occurrences="34" value="se" /> + <ngram occurrences="33" value="na" /> + <ngram occurrences="32" value="qu" /> + <ngram occurrences="32" value="q" /> + <ngram occurrences="31" value="ue_" /> + <ngram occurrences="31" value="s_d" /> + <ngram occurrences="31" value="que" /> + <ngram occurrences="31" value="in" /> + <ngram occurrences="31" value="ic" /> + <ngram occurrences="31" value="ent" /> + <ngram occurrences="30" value="ó" /> + <ngram occurrences="30" value="ro" /> + <ngram occurrences="30" value="h" /> + <ngram occurrences="29" value="un" /> + <ngram occurrences="29" value="mi" /> + <ngram occurrences="29" value="el_" /> + <ngram occurrences="29" value="_po" /> + <ngram occurrences="28" value="í" /> + <ngram occurrences="28" value="s_de" /> + <ngram occurrences="28" value="pa" /> + <ngram occurrences="28" value="le" /> + <ngram occurrences="28" value="da" /> + <ngram occurrences="28" value="_y" /> + <ngram occurrences="28" value="_co" /> + <ngram occurrences="27" value="y_" /> + <ngram occurrences="27" value="que_" /> + <ngram occurrences="27" value="do_" /> + <ngram occurrences="26" value="s_de_" /> + <ngram occurrences="26" value="ni" /> + <ngram occurrences="26" value="e_la" /> + <ngram occurrences="26" value="ac" /> + <ngram occurrences="26" value="a_d" /> + <ngram occurrences="26" value="_en" /> + <ngram occurrences="25" value="tr" /> + <ngram occurrences="25" value="de_l" /> + <ngram occurrences="25" value="_que_" /> + <ngram occurrences="25" value="_que" /> + <ngram occurrences="25" value="_qu" /> + <ngram occurrences="25" value="_q" /> + <ngram occurrences="25" value="_de_l" /> + <ngram occurrences="24" value="por" /> + <ngram occurrences="24" value="ie" /> + <ngram occurrences="24" value="id" /> + <ngram occurrences="24" value="en_" /> + <ngram occurrences="24" value="ec" /> + <ngram occurrences="24" value="a_de" /> + <ngram occurrences="24" value="_f" /> + <ngram occurrences="23" value="ti" /> + <ngram occurrences="23" value="or_" /> + <ngram occurrences="23" value="ma" /> + <ngram occurrences="23" value="ió" /> + <ngram occurrences="23" value="_y_" /> + <ngram occurrences="22" value="ón_" /> + <ngram occurrences="22" value="ón" /> + <ngram occurrences="22" value="á" /> + <ngram occurrences="22" value="ri" /> + <ngram occurrences="22" value="nd" /> + <ngram occurrences="22" value="_t" /> + <ngram occurrences="22" value="_lo" /> + <ngram occurrences="21" value="pr" /> + <ngram occurrences="21" value="me" /> + <ngram occurrences="21" value="ión_" /> + <ngram occurrences="21" value="ión" /> + <ngram occurrences="21" value="e_la_" /> + <ngram occurrences="21" value="_se" /> + <ngram occurrences="21" value="_por" /> + <ngram occurrences="20" value="te_" /> + <ngram occurrences="20" value="o_d" /> + <ngram occurrences="20" value="nte" /> + <ngram occurrences="20" value="ne" /> + <ngram occurrences="20" value="j" /> + <ngram occurrences="20" value="e_p" /> + <ngram occurrences="20" value="e_e" /> + <ngram occurrences="20" value="ció" /> + <ngram occurrences="20" value="a_l" /> + <ngram occurrences="20" value="_i" /> + <ngram occurrences="20" value="_en_" /> + <ngram occurrences="20" value="_el_" /> + <ngram occurrences="20" value="_el" /> + <ngram occurrences="19" value="por_" /> + <ngram occurrences="19" value="om" /> + <ngram occurrences="19" value="o_de" /> + <ngram occurrences="19" value="est" /> + <ngram occurrences="19" value="di" /> + <ngram occurrences="19" value="de_la" /> + <ngram occurrences="19" value="ción_" /> + <ngram occurrences="19" value="ción" /> + <ngram occurrences="19" value="ce" /> + <ngram occurrences="19" value="a_c" /> + <ngram occurrences="19" value="_por_" /> + <ngram occurrences="19" value="_h" /> + <ngram occurrences="18" value="to_" /> + <ngram occurrences="18" value="io" /> + <ngram occurrences="18" value="aci" /> + <ngram occurrences="18" value="_pr" /> + <ngram occurrences="18" value="_es" /> + <ngram occurrences="17" value="los_" /> + <ngram occurrences="17" value="los" /> + <ngram occurrences="17" value="a_de_" /> + <ngram occurrences="17" value="_u" /> + <ngram occurrences="16" value="ía" /> + <ngram occurrences="16" value="ta_" /> + <ngram occurrences="16" value="oc" /> + <ngram occurrences="16" value="no" /> + <ngram occurrences="16" value="ado" /> + <ngram occurrences="16" value="a_p" /> + <ngram occurrences="16" value="_pa" /> + <ngram occurrences="16" value="_n" /> + <ngram occurrences="15" value="z" /> + <ngram occurrences="15" value="se_" /> + <ngram occurrences="15" value="ra_" /> + <ngram occurrences="15" value="o_de_" /> + <ngram occurrences="15" value="na_" /> + <ngram occurrences="15" value="n_l" /> + <ngram occurrences="15" value="mo" /> + <ngram occurrences="15" value="is" /> + <ngram occurrences="15" value="_v" /> + <ngram occurrences="15" value="_un" /> + <ngram occurrences="15" value="_r" /> + <ngram occurrences="15" value="_los_" /> + <ngram occurrences="15" value="_los" /> + <ngram occurrences="15" value="_a_" /> + <ngram occurrences="14" value="ía_" /> + <ngram occurrences="14" value="si" /> + <ngram occurrences="14" value="li" /> + <ngram occurrences="14" value="las" /> + <ngram occurrences="14" value="im" /> + <ngram occurrences="14" value="ien" /> + <ngram occurrences="14" value="dad" /> + <ngram occurrences="14" value="cu" /> + <ngram occurrences="14" value="_o" /> + <ngram occurrences="14" value="_ma" /> + <ngram occurrences="13" value="tra" /> + <ngram occurrences="13" value="par" /> + <ngram occurrences="13" value="o_a" /> + <ngram occurrences="13" value="nto" /> + <ngram occurrences="13" value="mp" /> + <ngram occurrences="13" value="las_" /> + <ngram occurrences="13" value="ha" /> + <ngram occurrences="13" value="com" /> + <ngram occurrences="13" value="am" /> + <ngram occurrences="13" value="ación" /> + <ngram occurrences="13" value="ació" /> + <ngram occurrences="13" value="_mi" /> + <ngram occurrences="13" value="_las_" /> + <ngram occurrences="13" value="_las" /> + <ngram occurrences="13" value="_in" /> + <ngram occurrences="13" value="_ca" /> + <ngram occurrences="12" value="vi" /> + <ngram occurrences="12" value="sta" /> + <ngram occurrences="12" value="sa" /> + <ngram occurrences="12" value="s_l" /> + <ngram occurrences="12" value="rt" /> + <ngram occurrences="12" value="nto_" /> + <ngram occurrences="12" value="nte_" /> + <ngram occurrences="12" value="n_d" /> + <ngram occurrences="12" value="e_d" /> + <ngram occurrences="12" value="ara" /> + <ngram occurrences="12" value="ar_" /> + <ngram occurrences="12" value="_ci" /> + <ngram occurrences="11" value="ve" /> + <ngram occurrences="11" value="s_c" /> + <ngram occurrences="11" value="pl" /> + <ngram occurrences="11" value="ol" /> + <ngram occurrences="11" value="n_la" /> + <ngram occurrences="11" value="n_de" /> + <ngram occurrences="11" value="men" /> + <ngram occurrences="11" value="ll" /> + <ngram occurrences="11" value="la_c" /> + <ngram occurrences="11" value="il" /> + <ngram occurrences="11" value="ient" /> + <ngram occurrences="11" value="ica" /> + <ngram occurrences="11" value="ia" /> + <ngram occurrences="11" value="ga" /> + <ngram occurrences="11" value="fe" /> + <ngram occurrences="11" value="et" /> + <ngram occurrences="11" value="ento" /> + <ngram occurrences="11" value="em" /> + <ngram occurrences="11" value="e_s" /> + <ngram occurrences="11" value="e_c" /> + <ngram occurrences="11" value="dos" /> + <ngram occurrences="11" value="des" /> + <ngram occurrences="11" value="at" /> + <ngram occurrences="11" value="al_" /> + <ngram occurrences="11" value="a_m" /> + <ngram occurrences="11" value="a_la" /> + <ngram occurrences="11" value="a_e" /> + <ngram occurrences="11" value="_re" /> + <ngram occurrences="11" value="_par" /> + <ngram occurrences="11" value="_la_c" /> + <ngram occurrences="11" value="_com" /> + <ngram occurrences="10" value="ur" /> + <ngram occurrences="10" value="una" /> + <ngram occurrences="10" value="sp" /> + <ngram occurrences="10" value="s_p" /> + <ngram occurrences="10" value="rr" /> + <ngram occurrences="10" value="res" /> + <ngram occurrences="10" value="os_d" /> + <ngram occurrences="10" value="one" /> + <ngram occurrences="10" value="nes_" /> + <ngram occurrences="10" value="nes" /> + <ngram occurrences="10" value="nc" /> + <ngram occurrences="10" value="n_de_" /> + <ngram occurrences="10" value="mu" /> + <ngram occurrences="10" value="lo_" /> + <ngram occurrences="10" value="les" /> + <ngram occurrences="10" value="iv" /> + <ngram occurrences="10" value="ir" /> + <ngram occurrences="10" value="if" /> + <ngram occurrences="10" value="iento" /> + <ngram occurrences="10" value="ido" /> + <ngram occurrences="10" value="ici" /> + <ngram occurrences="10" value="ho" /> + <ngram occurrences="10" value="er_" /> + <ngram occurrences="10" value="ento_" /> + <ngram occurrences="10" value="ente" /> + <ngram occurrences="10" value="e_m" /> + <ngram occurrences="10" value="e_de" /> + <ngram occurrences="10" value="dos_" /> + <ngram occurrences="10" value="ba" /> + <ngram occurrences="10" value="ado_" /> + <ngram occurrences="10" value="_una" /> + <ngram occurrences="10" value="_se_" /> + <ngram occurrences="10" value="_j" /> + <ngram occurrences="10" value="_ha" /> + <ngram occurrences="10" value="_b" /> + <ngram occurrences="9" value="ón_de" /> + <ngram occurrences="9" value="ón_d" /> + <ngram occurrences="9" value="ñ" /> + <ngram occurrences="9" value="é" /> + <ngram occurrences="9" value="za" /> + <ngram occurrences="9" value="una_" /> + <ngram occurrences="9" value="ul" /> + <ngram occurrences="9" value="ud" /> + <ngram occurrences="9" value="ten" /> + <ngram occurrences="9" value="ste" /> + <ngram occurrences="9" value="so" /> + <ngram occurrences="9" value="s_y" /> + <ngram occurrences="9" value="s_s" /> + <ngram occurrences="9" value="s_que" /> + <ngram occurrences="9" value="s_qu" /> + <ngram occurrences="9" value="s_q" /> + <ngram occurrences="9" value="s_e" /> + <ngram occurrences="9" value="s_a" /> + <ngram occurrences="9" value="r_c" /> + <ngram occurrences="9" value="pu" /> + <ngram occurrences="9" value="pro" /> + <ngram occurrences="9" value="ot" /> + <ngram occurrences="9" value="os_de" /> + <ngram occurrences="9" value="on_" /> + <ngram occurrences="9" value="o_e" /> + <ngram occurrences="9" value="les_" /> + <ngram occurrences="9" value="ion" /> + <ngram occurrences="9" value="ida" /> + <ngram occurrences="9" value="gr" /> + <ngram occurrences="9" value="fi" /> + <ngram occurrences="9" value="es_d" /> + <ngram occurrences="9" value="e_los" /> + <ngram occurrences="9" value="e_lo" /> + <ngram occurrences="9" value="ct" /> + <ngram occurrences="9" value="cie" /> + <ngram occurrences="9" value="cal" /> + <ngram occurrences="9" value="as_de" /> + <ngram occurrences="9" value="as_d" /> + <ngram occurrences="9" value="and" /> + <ngram occurrences="9" value="an_" /> + <ngram occurrences="9" value="a_y" /> + <ngram occurrences="9" value="a_po" /> + <ngram occurrences="9" value="a_a" /> + <ngram occurrences="9" value="_una_" /> + <ngram occurrences="9" value="_pro" /> + <ngram occurrences="8" value="su" /> + <ngram occurrences="8" value="s_y_" /> + <ngram occurrences="8" value="rec" /> + <ngram occurrences="8" value="r_e" /> + <ngram occurrences="8" value="pe" /> + <ngram occurrences="8" value="para_" /> + <ngram occurrences="8" value="para" /> + <ngram occurrences="8" value="no_" /> + <ngram occurrences="8" value="nic" /> + <ngram occurrences="8" value="ndo" /> + <ngram occurrences="8" value="n_p" /> + <ngram occurrences="8" value="n_la_" /> + <ngram occurrences="8" value="n_c" /> + <ngram occurrences="8" value="ment" /> + <ngram occurrences="8" value="l_p" /> + <ngram occurrences="8" value="ión_d" /> + <ngram occurrences="8" value="ist" /> + <ngram occurrences="8" value="ido_" /> + <ngram occurrences="8" value="fu" /> + <ngram occurrences="8" value="fo" /> + <ngram occurrences="8" value="esp" /> + <ngram occurrences="8" value="es_de" /> + <ngram occurrences="8" value="eri" /> + <ngram occurrences="8" value="en_la" /> + <ngram occurrences="8" value="en_l" /> + <ngram occurrences="8" value="eg" /> + <ngram occurrences="8" value="ece" /> + <ngram occurrences="8" value="e_se" /> + <ngram occurrences="8" value="do_a" /> + <ngram occurrences="8" value="del_" /> + <ngram occurrences="8" value="del" /> + <ngram occurrences="8" value="de_p" /> + <ngram occurrences="8" value="de_m" /> + <ngram occurrences="8" value="con" /> + <ngram occurrences="8" value="cen" /> + <ngram occurrences="8" value="ara_" /> + <ngram occurrences="8" value="ant" /> + <ngram occurrences="8" value="ab" /> + <ngram occurrences="8" value="a_f" /> + <ngram occurrences="8" value="_tr" /> + <ngram occurrences="8" value="_para" /> + <ngram occurrences="8" value="_fu" /> + <ngram occurrences="8" value="_est" /> + <ngram occurrences="8" value="_en_l" /> + <ngram occurrences="8" value="_del_" /> + <ngram occurrences="8" value="_del" /> + <ngram occurrences="8" value="_de_m" /> + <ngram occurrences="8" value="_al" /> + <ngram occurrences="7" value="ú" /> + <ngram occurrences="7" value="x" /> + <ngram occurrences="7" value="ue_s" /> + <ngram occurrences="7" value="to_de" /> + <ngram occurrences="7" value="to_d" /> + <ngram occurrences="7" value="ter" /> + <ngram occurrences="7" value="str" /> + <ngram occurrences="7" value="sta_" /> +</ngrams> diff --git a/src/plugins/language/swahili.klp b/src/plugins/language/swahili.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="845" value="a" /> + <ngram occurrences="709" value="_" /> + <ngram occurrences="489" value="i" /> + <ngram occurrences="371" value="a_" /> + <ngram occurrences="261" value="k" /> + <ngram occurrences="250" value="u" /> + <ngram occurrences="200" value="n" /> + <ngram occurrences="192" value="w" /> + <ngram occurrences="178" value="m" /> + <ngram occurrences="168" value="o" /> + <ngram occurrences="165" value="e" /> + <ngram occurrences="162" value="wa" /> + <ngram occurrences="155" value="h" /> + <ngram occurrences="143" value="i_" /> + <ngram occurrences="137" value="s" /> + <ngram occurrences="134" value="t" /> + <ngram occurrences="134" value="l" /> + <ngram occurrences="129" value="_k" /> + <ngram occurrences="100" value="y" /> + <ngram occurrences="95" value="_w" /> + <ngram occurrences="85" value="_wa" /> + <ngram occurrences="83" value="wa_" /> + <ngram occurrences="80" value="_m" /> + <ngram occurrences="79" value="r" /> + <ngram occurrences="78" value="o_" /> + <ngram occurrences="78" value="ka" /> + <ngram occurrences="77" value="ku" /> + <ngram occurrences="75" value="li" /> + <ngram occurrences="73" value="z" /> + <ngram occurrences="71" value="ma" /> + <ngram occurrences="71" value="b" /> + <ngram occurrences="71" value="a_k" /> + <ngram occurrences="63" value="an" /> + <ngram occurrences="61" value="ya" /> + <ngram occurrences="59" value="g" /> + <ngram occurrences="56" value="ha" /> + <ngram occurrences="56" value="a_m" /> + <ngram occurrences="55" value="na" /> + <ngram occurrences="55" value="j" /> + <ngram occurrences="55" value="ik" /> + <ngram occurrences="54" value="d" /> + <ngram occurrences="53" value="_ku" /> + <ngram occurrences="50" value="f" /> + <ngram occurrences="50" value="at" /> + <ngram occurrences="49" value="am" /> + <ngram occurrences="49" value="_n" /> + <ngram occurrences="48" value="ya_" /> + <ngram occurrences="47" value="u_" /> + <ngram occurrences="47" value="is" /> + <ngram occurrences="46" value="hi" /> + <ngram occurrences="45" value="al" /> + <ngram occurrences="45" value="_ya" /> + <ngram occurrences="45" value="_y" /> + <ngram occurrences="45" value="_a" /> + <ngram occurrences="44" value="ki" /> + <ngram occurrences="44" value="a_w" /> + <ngram occurrences="42" value="sh" /> + <ngram occurrences="42" value="e_" /> + <ngram occurrences="41" value="ti" /> + <ngram occurrences="41" value="ta" /> + <ngram occurrences="41" value="ri" /> + <ngram occurrences="41" value="_h" /> + <ngram occurrences="39" value="il" /> + <ngram occurrences="39" value="ia" /> + <ngram occurrences="39" value="_ma" /> + <ngram occurrences="38" value="p" /> + <ngram occurrences="37" value="a_wa" /> + <ngram occurrences="37" value="_ya_" /> + <ngram occurrences="36" value="_ka" /> + <ngram occurrences="34" value="zi" /> + <ngram occurrences="34" value="ni" /> + <ngram occurrences="34" value="ng" /> + <ngram occurrences="34" value="ali" /> + <ngram occurrences="34" value="_wa_" /> + <ngram occurrences="32" value="na_" /> + <ngram occurrences="32" value="ba" /> + <ngram occurrences="31" value="ia_" /> + <ngram occurrences="31" value="ar" /> + <ngram occurrences="31" value="ak" /> + <ngram occurrences="31" value="a_ma" /> + <ngram occurrences="30" value="la" /> + <ngram occurrences="29" value="v" /> + <ngram occurrences="28" value="mb" /> + <ngram occurrences="28" value="ika" /> + <ngram occurrences="28" value="i_k" /> + <ngram occurrences="28" value="a_ku" /> + <ngram occurrences="28" value="_u" /> + <ngram occurrences="27" value="ili" /> + <ngram occurrences="27" value="ati" /> + <ngram occurrences="27" value="as" /> + <ngram occurrences="27" value="_s" /> + <ngram occurrences="26" value="ni_" /> + <ngram occurrences="26" value="in" /> + <ngram occurrences="26" value="a_n" /> + <ngram occurrences="25" value="za" /> + <ngram occurrences="25" value="li_" /> + <ngram occurrences="25" value="kw" /> + <ngram occurrences="25" value="kat" /> + <ngram occurrences="25" value="i_w" /> + <ngram occurrences="25" value="_na" /> + <ngram occurrences="24" value="se" /> + <ngram occurrences="24" value="i_wa" /> + <ngram occurrences="23" value="si" /> + <ngram occurrences="23" value="kwa" /> + <ngram occurrences="23" value="c" /> + <ngram occurrences="22" value="zi_" /> + <ngram occurrences="22" value="sa" /> + <ngram occurrences="22" value="ma_" /> + <ngram occurrences="22" value="kati" /> + <ngram occurrences="22" value="ka_" /> + <ngram occurrences="22" value="_l" /> + <ngram occurrences="21" value="ut" /> + <ngram occurrences="21" value="un" /> + <ngram occurrences="21" value="ish" /> + <ngram occurrences="21" value="hu" /> + <ngram occurrences="21" value="fa" /> + <ngram occurrences="21" value="ch" /> + <ngram occurrences="21" value="_v" /> + <ngram occurrences="21" value="_na_" /> + <ngram occurrences="21" value="_kw" /> + <ngram occurrences="20" value="nd" /> + <ngram occurrences="20" value="di" /> + <ngram occurrences="20" value="a_u" /> + <ngram occurrences="20" value="a_s" /> + <ngram occurrences="19" value="sha" /> + <ngram occurrences="19" value="mba" /> + <ngram occurrences="19" value="ja" /> + <ngram occurrences="19" value="it" /> + <ngram occurrences="19" value="ana" /> + <ngram occurrences="19" value="ai" /> + <ngram occurrences="19" value="_kwa" /> + <ngram occurrences="18" value="za_" /> + <ngram occurrences="18" value="yo" /> + <ngram occurrences="18" value="ko" /> + <ngram occurrences="18" value="ika_" /> + <ngram occurrences="18" value="er" /> + <ngram occurrences="18" value="amb" /> + <ngram occurrences="18" value="a_ya" /> + <ngram occurrences="18" value="a_y" /> + <ngram occurrences="18" value="a_a" /> + <ngram occurrences="18" value="_t" /> + <ngram occurrences="18" value="_kat" /> + <ngram occurrences="17" value="ya_k" /> + <ngram occurrences="17" value="on" /> + <ngram occurrences="17" value="kwa_" /> + <ngram occurrences="17" value="en" /> + <ngram occurrences="17" value="bi" /> + <ngram occurrences="17" value="af" /> + <ngram occurrences="17" value="_z" /> + <ngram occurrences="17" value="_ki" /> + <ngram occurrences="17" value="_i" /> + <ngram occurrences="17" value="_hi" /> + <ngram occurrences="16" value="wak" /> + <ngram occurrences="16" value="wa_m" /> + <ngram occurrences="16" value="tu" /> + <ngram occurrences="16" value="ny" /> + <ngram occurrences="16" value="mi" /> + <ngram occurrences="16" value="la_" /> + <ngram occurrences="16" value="ha_" /> + <ngram occurrences="16" value="fu" /> + <ngram occurrences="16" value="ek" /> + <ngram occurrences="16" value="ama" /> + <ngram occurrences="16" value="aj" /> + <ngram occurrences="16" value="aa" /> + <ngram occurrences="16" value="a_v" /> + <ngram occurrences="16" value="_kati" /> + <ngram occurrences="16" value="_ha" /> + <ngram occurrences="16" value="_ali" /> + <ngram occurrences="16" value="_al" /> + <ngram occurrences="15" value="um" /> + <ngram occurrences="15" value="ti_" /> + <ngram occurrences="15" value="sa_" /> + <ngram occurrences="15" value="rik" /> + <ngram occurrences="15" value="ji" /> + <ngram occurrences="15" value="iw" /> + <ngram occurrences="15" value="iki" /> + <ngram occurrences="15" value="if" /> + <ngram occurrences="15" value="he" /> + <ngram occurrences="15" value="ao" /> + <ngram occurrences="15" value="amba" /> + <ngram occurrences="15" value="a_ya_" /> + <ngram occurrences="15" value="a_ki" /> + <ngram occurrences="15" value="a_h" /> + <ngram occurrences="15" value="_wak" /> + <ngram occurrences="15" value="_la" /> + <ngram occurrences="15" value="_j" /> + <ngram occurrences="15" value="_b" /> + <ngram occurrences="14" value="wa_k" /> + <ngram occurrences="14" value="us" /> + <ngram occurrences="14" value="tik" /> + <ngram occurrences="14" value="ra" /> + <ngram occurrences="14" value="le" /> + <ngram occurrences="14" value="iz" /> + <ngram occurrences="14" value="iwa" /> + <ngram occurrences="14" value="i_wa_" /> + <ngram occurrences="14" value="i_ku" /> + <ngram occurrences="14" value="eri" /> + <ngram occurrences="14" value="em" /> + <ngram occurrences="14" value="a_ka" /> + <ngram occurrences="14" value="_ya_k" /> + <ngram occurrences="14" value="_se" /> + <ngram occurrences="13" value="wan" /> + <ngram occurrences="13" value="uu" /> + <ngram occurrences="13" value="ul" /> + <ngram occurrences="13" value="to" /> + <ngram occurrences="13" value="tika_" /> + <ngram occurrences="13" value="tika" /> + <ngram occurrences="13" value="ke" /> + <ngram occurrences="13" value="katik" /> + <ngram occurrences="13" value="i_ya" /> + <ngram occurrences="13" value="i_y" /> + <ngram occurrences="13" value="go" /> + <ngram occurrences="13" value="ga" /> + <ngram occurrences="13" value="atika" /> + <ngram occurrences="13" value="atik" /> + <ngram occurrences="13" value="ari" /> + <ngram occurrences="13" value="a_t" /> + <ngram occurrences="13" value="a_na" /> + <ngram occurrences="13" value="a_kw" /> + <ngram occurrences="13" value="_kwa_" /> + <ngram occurrences="12" value="yo_" /> + <ngram occurrences="12" value="ye" /> + <ngram occurrences="12" value="vy" /> + <ngram occurrences="12" value="ua" /> + <ngram occurrences="12" value="pi" /> + <ngram occurrences="12" value="mu" /> + <ngram occurrences="12" value="mk" /> + <ngram occurrences="12" value="kut" /> + <ngram occurrences="12" value="ini" /> + <ngram occurrences="12" value="ili_" /> + <ngram occurrences="12" value="ho" /> + <ngram occurrences="12" value="ao_" /> + <ngram occurrences="12" value="a_kwa" /> + <ngram occurrences="12" value="_za" /> + <ngram occurrences="12" value="_mk" /> + <ngram occurrences="11" value="we" /> + <ngram occurrences="11" value="wal" /> + <ngram occurrences="11" value="vi" /> + <ngram occurrences="11" value="uwa" /> + <ngram occurrences="11" value="uw" /> + <ngram occurrences="11" value="uu_" /> + <ngram occurrences="11" value="sha_" /> + <ngram occurrences="11" value="no" /> + <ngram occurrences="11" value="ndi" /> + <ngram occurrences="11" value="mo" /> + <ngram occurrences="11" value="kuwa" /> + <ngram occurrences="11" value="kuw" /> + <ngram occurrences="11" value="kam" /> + <ngram occurrences="11" value="iy" /> + <ngram occurrences="11" value="iwa_" /> + <ngram occurrences="11" value="im" /> + <ngram occurrences="11" value="ifa" /> + <ngram occurrences="11" value="i_z" /> + <ngram occurrences="11" value="i_ya_" /> + <ngram occurrences="11" value="i_m" /> + <ngram occurrences="11" value="fa_" /> + <ngram occurrences="11" value="di_" /> + <ngram occurrences="11" value="da" /> + <ngram occurrences="11" value="az" /> + <ngram occurrences="11" value="aw" /> + <ngram occurrences="11" value="ali_" /> + <ngram occurrences="11" value="aki" /> + <ngram occurrences="11" value="ad" /> + <ngram occurrences="11" value="a_na_" /> + <ngram occurrences="11" value="a_hi" /> + <ngram occurrences="11" value="_ta" /> + <ngram occurrences="11" value="_am" /> + <ngram occurrences="10" value="zi_w" /> + <ngram occurrences="10" value="ya_ki" /> + <ngram occurrences="10" value="wa_n" /> + <ngram occurrences="10" value="wa_ma" /> + <ngram occurrences="10" value="uz" /> + <ngram occurrences="10" value="uta" /> + <ngram occurrences="10" value="uh" /> + <ngram occurrences="10" value="rika" /> + <ngram occurrences="10" value="pa" /> + <ngram occurrences="10" value="ot" /> + <ngram occurrences="10" value="o_h" /> + <ngram occurrences="10" value="no_" /> + <ngram occurrences="10" value="me" /> + <ngram occurrences="10" value="iyo" /> + <ngram occurrences="10" value="ini_" /> + <ngram occurrences="10" value="ifa_" /> + <ngram occurrences="10" value="ge" /> + <ngram occurrences="10" value="ez" /> + <ngram occurrences="10" value="es" /> + <ngram occurrences="10" value="ba_" /> + <ngram occurrences="10" value="ay" /> + <ngram occurrences="10" value="au" /> + <ngram occurrences="10" value="ang" /> + <ngram occurrences="10" value="ah" /> + <ngram occurrences="10" value="ab" /> + <ngram occurrences="10" value="a_vi" /> + <ngram occurrences="10" value="a_se" /> + <ngram occurrences="10" value="_vy" /> + <ngram occurrences="10" value="_vi" /> + <ngram occurrences="10" value="_p" /> + <ngram occurrences="10" value="_kam" /> + <ngram occurrences="9" value="zo" /> + <ngram occurrences="9" value="zi_wa" /> + <ngram occurrences="9" value="wana" /> + <ngram occurrences="9" value="wa_w" /> + <ngram occurrences="9" value="vya" /> + <ngram occurrences="9" value="ur" /> + <ngram occurrences="9" value="uo" /> + <ngram occurrences="9" value="u_wa" /> + <ngram occurrences="9" value="u_w" /> + <ngram occurrences="9" value="th" /> + <ngram occurrences="9" value="o_wa" /> + <ngram occurrences="9" value="o_w" /> + <ngram occurrences="9" value="o_k" /> + <ngram occurrences="9" value="o_a" /> + <ngram occurrences="9" value="nj" /> + <ngram occurrences="9" value="ngo" /> + <ngram occurrences="9" value="nga" /> + <ngram occurrences="9" value="mar" /> + <ngram occurrences="9" value="lis" /> + <ngram occurrences="9" value="kuu" /> + <ngram occurrences="9" value="kis" /> + <ngram occurrences="9" value="ki_" /> + <ngram occurrences="9" value="je" /> + <ngram occurrences="9" value="ip" /> + <ngram occurrences="9" value="iki_" /> + <ngram occurrences="9" value="id" /> + <ngram occurrences="9" value="ib" /> + <ngram occurrences="9" value="i_ka" /> + <ngram occurrences="9" value="i_a" /> + <ngram occurrences="9" value="ho_" /> + <ngram occurrences="9" value="hi_" /> + <ngram occurrences="9" value="gu" /> + <ngram occurrences="9" value="dh" /> + <ngram occurrences="9" value="cha" /> + <ngram occurrences="9" value="ani" /> + <ngram occurrences="9" value="ana_" /> + <ngram occurrences="9" value="ama_" /> + <ngram occurrences="9" value="ag" /> + <ngram occurrences="9" value="a_wak" /> + <ngram occurrences="9" value="a_wa_" /> + <ngram occurrences="9" value="a_mk" /> + <ngram occurrences="9" value="a_l" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="_vya" /> + <ngram occurrences="9" value="_la_" /> + <ngram occurrences="8" value="wi" /> + <ngram occurrences="8" value="wa_s" /> + <ngram occurrences="8" value="uwa_" /> + <ngram occurrences="8" value="ung" /> + <ngram occurrences="8" value="tu_" /> + <ngram occurrences="8" value="ta_" /> + <ngram occurrences="8" value="su" /> + <ngram occurrences="8" value="sem" /> + <ngram occurrences="8" value="ok" /> + <ngram occurrences="8" value="nz" /> + <ngram occurrences="8" value="mku" /> + <ngram occurrences="8" value="kuwa_" /> + <ngram occurrences="8" value="kuu_" /> + <ngram occurrences="8" value="kali_" /> + <ngram occurrences="8" value="kali" /> + <ngram occurrences="8" value="kal" /> + <ngram occurrences="8" value="ju" /> + <ngram occurrences="8" value="isha" /> + <ngram occurrences="8" value="i_za" /> + <ngram occurrences="8" value="ema_" /> + <ngram occurrences="8" value="ema" /> + <ngram occurrences="8" value="eke" /> + <ngram occurrences="8" value="bw" /> + <ngram occurrences="8" value="azi" /> + <ngram occurrences="8" value="awa" /> + <ngram occurrences="8" value="atu" /> + <ngram occurrences="8" value="ati_" /> + <ngram occurrences="8" value="ata" /> + <ngram occurrences="8" value="asi" /> + <ngram occurrences="8" value="aka" /> + <ngram occurrences="8" value="aji" /> + <ngram occurrences="8" value="a_ta" /> + <ngram occurrences="8" value="a_mar" /> + <ngram occurrences="8" value="a_j" /> + <ngram occurrences="8" value="_za_" /> + <ngram occurrences="8" value="_r" /> + <ngram occurrences="8" value="_ni" /> + <ngram occurrences="8" value="_mku" /> + <ngram occurrences="8" value="_mar" /> + <ngram occurrences="8" value="_kut" /> + <ngram occurrences="8" value="_amba" /> + <ngram occurrences="8" value="_amb" /> + <ngram occurrences="7" value="ye_" /> + <ngram occurrences="7" value="wam" /> + <ngram occurrences="7" value="wali" /> + <ngram occurrences="7" value="w_" /> + <ngram occurrences="7" value="uo_" /> + <ngram occurrences="7" value="uli" /> + <ngram occurrences="7" value="uhu" /> + <ngram occurrences="7" value="uf" /> + <ngram occurrences="7" value="te" /> + <ngram occurrences="7" value="serik" /> + <ngram occurrences="7" value="seri" /> + <ngram occurrences="7" value="ser" /> + <ngram occurrences="7" value="sema_" /> + <ngram occurrences="7" value="sema" /> + <ngram occurrences="7" value="rikal" /> +</ngrams> diff --git a/src/plugins/language/tagalog.klp b/src/plugins/language/tagalog.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="874" value="a" /> + <ngram occurrences="786" value="_" /> + <ngram occurrences="480" value="n" /> + <ngram occurrences="346" value="i" /> + <ngram occurrences="303" value="g" /> + <ngram occurrences="211" value="ng" /> + <ngram occurrences="210" value="a_" /> + <ngram occurrences="192" value="g_" /> + <ngram occurrences="184" value="t" /> + <ngram occurrences="180" value="ng_" /> + <ngram occurrences="175" value="o" /> + <ngram occurrences="167" value="k" /> + <ngram occurrences="163" value="an" /> + <ngram occurrences="163" value="_n" /> + <ngram occurrences="162" value="s" /> + <ngram occurrences="147" value="l" /> + <ngram occurrences="142" value="m" /> + <ngram occurrences="121" value="p" /> + <ngram occurrences="113" value="na" /> + <ngram occurrences="105" value="y" /> + <ngram occurrences="104" value="u" /> + <ngram occurrences="102" value="ang" /> + <ngram occurrences="100" value="_a" /> + <ngram occurrences="93" value="ang_" /> + <ngram occurrences="84" value="in" /> + <ngram occurrences="82" value="ka" /> + <ngram occurrences="82" value="_na" /> + <ngram occurrences="81" value="_s" /> + <ngram occurrences="81" value="_m" /> + <ngram occurrences="80" value="o_" /> + <ngram occurrences="80" value="la" /> + <ngram occurrences="79" value="b" /> + <ngram occurrences="77" value="r" /> + <ngram occurrences="74" value="pa" /> + <ngram occurrences="74" value="ma" /> + <ngram occurrences="73" value="sa" /> + <ngram occurrences="71" value="_p" /> + <ngram occurrences="70" value="ak" /> + <ngram occurrences="67" value="n_" /> + <ngram occurrences="67" value="h" /> + <ngram occurrences="61" value="_k" /> + <ngram occurrences="59" value="d" /> + <ngram occurrences="59" value="al" /> + <ngram occurrences="57" value="t_" /> + <ngram occurrences="55" value="at" /> + <ngram occurrences="52" value="ag" /> + <ngram occurrences="51" value="_sa" /> + <ngram occurrences="51" value="_pa" /> + <ngram occurrences="50" value="ta" /> + <ngram occurrences="48" value="sa_" /> + <ngram occurrences="47" value="ni" /> + <ngram occurrences="47" value="_ng" /> + <ngram occurrences="45" value="_ma" /> + <ngram occurrences="42" value="ya" /> + <ngram occurrences="41" value="it" /> + <ngram occurrences="41" value="ay" /> + <ngram occurrences="41" value="_sa_" /> + <ngram occurrences="41" value="_ka" /> + <ngram occurrences="41" value="_an" /> + <ngram occurrences="40" value="e" /> + <ngram occurrences="40" value="_i" /> + <ngram occurrences="39" value="y_" /> + <ngram occurrences="39" value="on" /> + <ngram occurrences="38" value="na_" /> + <ngram occurrences="37" value="w" /> + <ngram occurrences="37" value="il" /> + <ngram occurrences="37" value="i_" /> + <ngram occurrences="37" value="ga" /> + <ngram occurrences="37" value="ala" /> + <ngram occurrences="37" value="_ng_" /> + <ngram occurrences="36" value="iy" /> + <ngram occurrences="34" value="an_" /> + <ngram occurrences="34" value="_t" /> + <ngram occurrences="34" value="_ang_" /> + <ngram occurrences="34" value="_ang" /> + <ngram occurrences="33" value="ba" /> + <ngram occurrences="33" value="_ni" /> + <ngram occurrences="32" value="am" /> + <ngram occurrences="32" value="_na_" /> + <ngram occurrences="31" value="ra" /> + <ngram occurrences="30" value="ha" /> + <ngram occurrences="30" value="a_s" /> + <ngram occurrences="30" value="_l" /> + <ngram occurrences="29" value="s_" /> + <ngram occurrences="29" value="iya" /> + <ngram occurrences="29" value="ar" /> + <ngram occurrences="28" value="is" /> + <ngram occurrences="28" value="hi" /> + <ngram occurrences="27" value="ya_" /> + <ngram occurrences="27" value="ong" /> + <ngram occurrences="27" value="li" /> + <ngram occurrences="27" value="aka" /> + <ngram occurrences="26" value="ong_" /> + <ngram occurrences="26" value="ko" /> + <ngram occurrences="26" value="as" /> + <ngram occurrences="25" value="to" /> + <ngram occurrences="25" value="si" /> + <ngram occurrences="25" value="ri" /> + <ngram occurrences="25" value="ap" /> + <ngram occurrences="25" value="a_p" /> + <ngram occurrences="25" value="a_n" /> + <ngram occurrences="25" value="_b" /> + <ngram occurrences="24" value="wa" /> + <ngram occurrences="24" value="un" /> + <ngram occurrences="24" value="lan" /> + <ngram occurrences="24" value="gi" /> + <ngram occurrences="24" value="di" /> + <ngram occurrences="24" value="ay_" /> + <ngram occurrences="24" value="ah" /> + <ngram occurrences="24" value="a_a" /> + <ngram occurrences="23" value="um" /> + <ngram occurrences="23" value="iya_" /> + <ngram occurrences="23" value="ing" /> + <ngram occurrences="23" value="ata" /> + <ngram occurrences="23" value="_d" /> + <ngram occurrences="22" value="ti" /> + <ngram occurrences="22" value="ki" /> + <ngram occurrences="22" value="at_" /> + <ngram occurrences="21" value="niya" /> + <ngram occurrences="21" value="niy" /> + <ngram occurrences="21" value="n_n" /> + <ngram occurrences="21" value="mo" /> + <ngram occurrences="21" value="in_" /> + <ngram occurrences="21" value="ab" /> + <ngram occurrences="21" value="_niya" /> + <ngram occurrences="21" value="_niy" /> + <ngram occurrences="21" value="_ak" /> + <ngram occurrences="20" value="ng_p" /> + <ngram occurrences="20" value="la_" /> + <ngram occurrences="20" value="ila" /> + <ngram occurrences="20" value="g_p" /> + <ngram occurrences="20" value="a_m" /> + <ngram occurrences="19" value="yo" /> + <ngram occurrences="19" value="nag" /> + <ngram occurrences="19" value="g_m" /> + <ngram occurrences="19" value="aw" /> + <ngram occurrences="19" value="a_sa" /> + <ngram occurrences="19" value="_mo" /> + <ngram occurrences="19" value="_h" /> + <ngram occurrences="18" value="ot" /> + <ngram occurrences="18" value="ng_m" /> + <ngram occurrences="18" value="lang" /> + <ngram occurrences="18" value="ig" /> + <ngram occurrences="18" value="g_n" /> + <ngram occurrences="18" value="a_pa" /> + <ngram occurrences="18" value="_si" /> + <ngram occurrences="17" value="tu" /> + <ngram occurrences="17" value="ng_t" /> + <ngram occurrences="17" value="ng_n" /> + <ngram occurrences="17" value="ing_" /> + <ngram occurrences="17" value="g_t" /> + <ngram occurrences="17" value="g_a" /> + <ngram occurrences="17" value="_at" /> + <ngram occurrences="16" value="y_n" /> + <ngram occurrences="16" value="t_n" /> + <ngram occurrences="16" value="ot_" /> + <ngram occurrences="16" value="niya_" /> + <ngram occurrences="16" value="nga" /> + <ngram occurrences="16" value="ng_i" /> + <ngram occurrences="16" value="ng_a" /> + <ngram occurrences="16" value="mo_" /> + <ngram occurrences="16" value="ina" /> + <ngram occurrences="16" value="g_i" /> + <ngram occurrences="16" value="ara" /> + <ngram occurrences="16" value="ama" /> + <ngram occurrences="16" value="ali" /> + <ngram occurrences="16" value="ako" /> + <ngram occurrences="16" value="aki" /> + <ngram occurrences="16" value="a_sa_" /> + <ngram occurrences="16" value="_mo_" /> + <ngram occurrences="16" value="_at_" /> + <ngram occurrences="15" value="to_" /> + <ngram occurrences="15" value="o_n" /> + <ngram occurrences="15" value="ng_s" /> + <ngram occurrences="15" value="nd" /> + <ngram occurrences="15" value="lang_" /> + <ngram occurrences="15" value="ka_" /> + <ngram occurrences="15" value="ga_" /> + <ngram occurrences="15" value="g_s" /> + <ngram occurrences="15" value="g_k" /> + <ngram occurrences="15" value="bi" /> + <ngram occurrences="15" value="aa" /> + <ngram occurrences="14" value="y_na" /> + <ngram occurrences="14" value="o_a" /> + <ngram occurrences="14" value="n_m" /> + <ngram occurrences="14" value="ko_" /> + <ngram occurrences="14" value="ib" /> + <ngram occurrences="14" value="g_l" /> + <ngram occurrences="14" value="da" /> + <ngram occurrences="14" value="ai" /> + <ngram occurrences="14" value="a_k" /> + <ngram occurrences="14" value="_r" /> + <ngram occurrences="14" value="_la" /> + <ngram occurrences="13" value="su" /> + <ngram occurrences="13" value="ro" /> + <ngram occurrences="13" value="pi" /> + <ngram occurrences="13" value="pa_" /> + <ngram occurrences="13" value="o_s" /> + <ngram occurrences="13" value="ng_l" /> + <ngram occurrences="13" value="mag" /> + <ngram occurrences="13" value="lo" /> + <ngram occurrences="13" value="l_" /> + <ngram occurrences="13" value="ito" /> + <ngram occurrences="13" value="it_" /> + <ngram occurrences="13" value="ik" /> + <ngram occurrences="13" value="hin" /> + <ngram occurrences="13" value="a_ma" /> + <ngram occurrences="13" value="_ta" /> + <ngram occurrences="13" value="_is" /> + <ngram occurrences="12" value="ul" /> + <ngram occurrences="12" value="rin" /> + <ngram occurrences="12" value="pan" /> + <ngram occurrences="12" value="nak" /> + <ngram occurrences="12" value="n_a" /> + <ngram occurrences="12" value="mi" /> + <ngram occurrences="12" value="ito_" /> + <ngram occurrences="12" value="is_" /> + <ngram occurrences="12" value="ilan" /> + <ngram occurrences="12" value="i_n" /> + <ngram occurrences="12" value="g_na" /> + <ngram occurrences="12" value="e_" /> + <ngram occurrences="12" value="an_n" /> + <ngram occurrences="12" value="ahi" /> + <ngram occurrences="12" value="a_ka" /> + <ngram occurrences="12" value="_y" /> + <ngram occurrences="12" value="_tu" /> + <ngram occurrences="12" value="_nag" /> + <ngram occurrences="12" value="_mag" /> + <ngram occurrences="12" value="_di" /> + <ngram occurrences="12" value="_ba" /> + <ngram occurrences="11" value="wala" /> + <ngram occurrences="11" value="wal" /> + <ngram occurrences="11" value="ung" /> + <ngram occurrences="11" value="sa_p" /> + <ngram occurrences="11" value="on_" /> + <ngram occurrences="11" value="ng_pa" /> + <ngram occurrences="11" value="ng_na" /> + <ngram occurrences="11" value="ng_k" /> + <ngram occurrences="11" value="man" /> + <ngram occurrences="11" value="lu" /> + <ngram occurrences="11" value="kin" /> + <ngram occurrences="11" value="k_" /> + <ngram occurrences="11" value="go" /> + <ngram occurrences="11" value="gk" /> + <ngram occurrences="11" value="g_pa" /> + <ngram occurrences="11" value="apa" /> + <ngram occurrences="11" value="ang_s" /> + <ngram occurrences="11" value="alan" /> + <ngram occurrences="11" value="a_l" /> + <ngram occurrences="11" value="_y_" /> + <ngram occurrences="11" value="_ri" /> + <ngram occurrences="11" value="_ako" /> + <ngram occurrences="10" value="yon" /> + <ngram occurrences="10" value="yan" /> + <ngram occurrences="10" value="uma" /> + <ngram occurrences="10" value="ra_" /> + <ngram occurrences="10" value="pu" /> + <ngram occurrences="10" value="p_" /> + <ngram occurrences="10" value="nan" /> + <ngram occurrences="10" value="naka" /> + <ngram occurrences="10" value="mu" /> + <ngram occurrences="10" value="mga_" /> + <ngram occurrences="10" value="mga" /> + <ngram occurrences="10" value="mg" /> + <ngram occurrences="10" value="isa" /> + <ngram occurrences="10" value="ir" /> + <ngram occurrences="10" value="ini" /> + <ngram occurrences="10" value="ilang" /> + <ngram occurrences="10" value="g_ma" /> + <ngram occurrences="10" value="di_" /> + <ngram occurrences="10" value="awa" /> + <ngram occurrences="10" value="asa" /> + <ngram occurrences="10" value="as_" /> + <ngram occurrences="10" value="ari" /> + <ngram occurrences="10" value="ang_n" /> + <ngram occurrences="10" value="ang_a" /> + <ngram occurrences="10" value="akin" /> + <ngram occurrences="10" value="agk" /> + <ngram occurrences="10" value="a_ng" /> + <ngram occurrences="10" value="a_na" /> + <ngram occurrences="10" value="_w" /> + <ngram occurrences="10" value="_mga_" /> + <ngram occurrences="10" value="_mga" /> + <ngram occurrences="10" value="_mg" /> + <ngram occurrences="10" value="_ka_" /> + <ngram occurrences="10" value="_isa" /> + <ngram occurrences="10" value="_ha" /> + <ngram occurrences="9" value="sa_pa" /> + <ngram occurrences="9" value="pag" /> + <ngram occurrences="9" value="o_sa_" /> + <ngram occurrences="9" value="o_sa" /> + <ngram occurrences="9" value="no" /> + <ngram occurrences="9" value="ng_ma" /> + <ngram occurrences="9" value="ng_ka" /> + <ngram occurrences="9" value="ng_d" /> + <ngram occurrences="9" value="may_" /> + <ngram occurrences="9" value="may" /> + <ngram occurrences="9" value="ku" /> + <ngram occurrences="9" value="in_m" /> + <ngram occurrences="9" value="gka" /> + <ngram occurrences="9" value="g_ka" /> + <ngram occurrences="9" value="g_d" /> + <ngram occurrences="9" value="d_" /> + <ngram occurrences="9" value="and" /> + <ngram occurrences="9" value="ala_" /> + <ngram occurrences="9" value="ako_" /> + <ngram occurrences="9" value="agka" /> + <ngram occurrences="9" value="aba" /> + <ngram occurrences="9" value="a_t" /> + <ngram occurrences="9" value="a_si" /> + <ngram occurrences="9" value="a_ri" /> + <ngram occurrences="9" value="a_r" /> + <ngram occurrences="9" value="a_i" /> + <ngram occurrences="9" value="a_b" /> + <ngram occurrences="9" value="a_ak" /> + <ngram occurrences="9" value="_wala" /> + <ngram occurrences="9" value="_wal" /> + <ngram occurrences="9" value="_wa" /> + <ngram occurrences="9" value="_pa_" /> + <ngram occurrences="9" value="_nak" /> + <ngram occurrences="9" value="_lu" /> + <ngram occurrences="9" value="_ku" /> + <ngram occurrences="9" value="_ako_" /> + <ngram occurrences="9" value="_akin" /> + <ngram occurrences="9" value="_aki" /> + <ngram occurrences="8" value="yang_" /> + <ngram occurrences="8" value="yang" /> + <ngram occurrences="8" value="ya_s" /> + <ngram occurrences="8" value="ut" /> + <ngram occurrences="8" value="umi" /> + <ngram occurrences="8" value="tay" /> + <ngram occurrences="8" value="tan" /> + <ngram occurrences="8" value="t_na" /> + <ngram occurrences="8" value="si_" /> + <ngram occurrences="8" value="san" /> + <ngram occurrences="8" value="s_n" /> + <ngram occurrences="8" value="ro_" /> + <ngram occurrences="8" value="pak" /> + <ngram occurrences="8" value="oo" /> + <ngram occurrences="8" value="o_na" /> + <ngram occurrences="8" value="o_an" /> + <ngram occurrences="8" value="na_m" /> + <ngram occurrences="8" value="n_ng" /> + <ngram occurrences="8" value="n_na" /> + <ngram occurrences="8" value="mat" /> + <ngram occurrences="8" value="king" /> + <ngram occurrences="8" value="kas" /> + <ngram occurrences="8" value="k_n" /> + <ngram occurrences="8" value="iti" /> + <ngram occurrences="8" value="ip" /> + <ngram occurrences="8" value="ili" /> + <ngram occurrences="8" value="igi" /> + <ngram occurrences="8" value="dib" /> + <ngram occurrences="8" value="bu" /> + <ngram occurrences="8" value="b_" /> + <ngram occurrences="8" value="ayo" /> + <ngram occurrences="8" value="ay_n" /> + <ngram occurrences="8" value="ang_t" /> + <ngram occurrences="8" value="ang_p" /> + <ngram occurrences="8" value="aman" /> + <ngram occurrences="8" value="alang" /> + <ngram occurrences="8" value="aking" /> + <ngram occurrences="8" value="aha" /> + <ngram occurrences="8" value="aga" /> + <ngram occurrences="8" value="abi" /> + <ngram occurrences="8" value="_su" /> + <ngram occurrences="8" value="_pu" /> + <ngram occurrences="8" value="_pag" /> + <ngram occurrences="8" value="_ng_m" /> + <ngram occurrences="8" value="_naka" /> + <ngram occurrences="8" value="_may_" /> + <ngram occurrences="8" value="_may" /> + <ngram occurrences="8" value="_hi" /> + <ngram occurrences="7" value="yo_" /> + <ngram occurrences="7" value="y_a" /> + <ngram occurrences="7" value="walan" /> + <ngram occurrences="7" value="tum" /> + <ngram occurrences="7" value="tin" /> + <ngram occurrences="7" value="tat" /> + <ngram occurrences="7" value="tang" /> + <ngram occurrences="7" value="tak" /> + <ngram occurrences="7" value="t_m" /> + <ngram occurrences="7" value="s_an" /> + <ngram occurrences="7" value="s_a" /> + <ngram occurrences="7" value="rin_" /> + <ngram occurrences="7" value="ram" /> + <ngram occurrences="7" value="pin" /> + <ngram occurrences="7" value="par" /> + <ngram occurrences="7" value="pal" /> + <ngram occurrences="7" value="ob" /> + <ngram occurrences="7" value="o_y" /> + <ngram occurrences="7" value="o_m" /> + <ngram occurrences="7" value="ng_tu" /> + <ngram occurrences="7" value="ng_sa" /> + <ngram occurrences="7" value="ng_mg" /> + <ngram occurrences="7" value="ng_lu" /> + <ngram occurrences="7" value="ng_is" /> + <ngram occurrences="7" value="ng_h" /> + <ngram occurrences="7" value="ng_b" /> + <ngram occurrences="7" value="ng_ak" /> +</ngrams> diff --git a/src/plugins/language/tamil.klp b/src/plugins/language/tamil.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1111" value="_" /> + <ngram occurrences="357" value="õ" /> + <ngram occurrences="281" value="ô" /> + <ngram occurrences="213" value="½" /> + <ngram occurrences="195" value="â" /> + <ngram occurrences="194" value="¸" /> + <ngram occurrences="156" value="õ_" /> + <ngram occurrences="154" value="_½" /> + <ngram occurrences="140" value="ÿ" /> + <ngram occurrences="128" value="à" /> + <ngram occurrences="120" value="_õ" /> + <ngram occurrences="116" value="ù" /> + <ngram occurrences="115" value="ç" /> + <ngram occurrences="109" value="ø" /> + <ngram occurrences="95" value="ô_" /> + <ngram occurrences="93" value="¨" /> + <ngram occurrences="93" value="å" /> + <ngram occurrences="87" value="á" /> + <ngram occurrences="81" value="æ" /> + <ngram occurrences="76" value="_¸" /> + <ngram occurrences="74" value="â_" /> + <ngram occurrences="74" value="_â" /> + <ngram occurrences="70" value="_ø" /> + <ngram occurrences="69" value="ÿ_" /> + <ngram occurrences="68" value="é" /> + <ngram occurrences="68" value="¹" /> + <ngram occurrences="68" value="_ô" /> + <ngram occurrences="64" value="½ô" /> + <ngram occurrences="62" value="ä" /> + <ngram occurrences="61" value="_õ_" /> + <ngram occurrences="61" value="_ç" /> + <ngram occurrences="58" value="à_" /> + <ngram occurrences="58" value="_é" /> + <ngram occurrences="56" value="¸_" /> + <ngram occurrences="51" value="_ÿ" /> + <ngram occurrences="50" value="þ" /> + <ngram occurrences="50" value="ç_" /> + <ngram occurrences="45" value="¨_" /> + <ngram occurrences="45" value="õ¸" /> + <ngram occurrences="44" value="_þ" /> + <ngram occurrences="42" value="í" /> + <ngram occurrences="40" value="½_" /> + <ngram occurrences="39" value="¸õ" /> + <ngram occurrences="39" value="æ_" /> + <ngram occurrences="39" value="á_" /> + <ngram occurrences="37" value="þ_" /> + <ngram occurrences="36" value="âõ" /> + <ngram occurrences="35" value="ü" /> + <ngram occurrences="35" value="ª" /> + <ngram occurrences="35" value="_½ô" /> + <ngram occurrences="35" value="_ù" /> + <ngram occurrences="34" value="ö" /> + <ngram occurrences="34" value="å_" /> + <ngram occurrences="34" value="_í" /> + <ngram occurrences="33" value="ø½" /> + <ngram occurrences="32" value="_å" /> + <ngram occurrences="31" value="ó" /> + <ngram occurrences="31" value="¹_" /> + <ngram occurrences="31" value="_þ_" /> + <ngram occurrences="30" value="¸ô" /> + <ngram occurrences="30" value="_ø½" /> + <ngram occurrences="29" value="½õ" /> + <ngram occurrences="28" value="ÿô" /> + <ngram occurrences="28" value="ý" /> + <ngram occurrences="27" value="é_" /> + <ngram occurrences="26" value="ô¸" /> + <ngram occurrences="26" value="ô¨" /> + <ngram occurrences="26" value="è" /> + <ngram occurrences="26" value="_½_" /> + <ngram occurrences="26" value="_à" /> + <ngram occurrences="25" value="ä_" /> + <ngram occurrences="25" value="àõ" /> + <ngram occurrences="25" value="_½õ" /> + <ngram occurrences="24" value="½à" /> + <ngram occurrences="24" value="õ_½" /> + <ngram occurrences="24" value="º" /> + <ngram occurrences="24" value="ª_" /> + <ngram occurrences="24" value="_á" /> + <ngram occurrences="23" value="ü_" /> + <ngram occurrences="23" value="ùá" /> + <ngram occurrences="23" value="ë" /> + <ngram occurrences="23" value="ã" /> + <ngram occurrences="22" value="¸ª_" /> + <ngram occurrences="22" value="¸ª" /> + <ngram occurrences="22" value="ø½ô" /> + <ngram occurrences="22" value="_è" /> + <ngram occurrences="21" value="ù_" /> + <ngram occurrences="21" value="ô¨_" /> + <ngram occurrences="21" value="_¸ô" /> + <ngram occurrences="21" value="_âõ" /> + <ngram occurrences="20" value="õ¨" /> + <ngram occurrences="20" value="_ø½ô" /> + <ngram occurrences="20" value="_é_" /> + <ngram occurrences="19" value="ì" /> + <ngram occurrences="19" value="âô" /> + <ngram occurrences="19" value="_ä" /> + <ngram occurrences="18" value="½ô_" /> + <ngram occurrences="18" value="ÿ_õ" /> + <ngram occurrences="18" value="ø_" /> + <ngram occurrences="18" value="ó_" /> + <ngram occurrences="18" value="î" /> + <ngram occurrences="18" value="àõ_" /> + <ngram occurrences="18" value="_½à" /> + <ngram occurrences="18" value="_ÿô" /> + <ngram occurrences="18" value="_ô¨" /> + <ngram occurrences="18" value="_î" /> + <ngram occurrences="18" value="_¹" /> + <ngram occurrences="17" value="õç" /> + <ngram occurrences="17" value="ô¸_" /> + <ngram occurrences="17" value="ôà" /> + <ngram occurrences="17" value="_à_" /> + <ngram occurrences="16" value="õ¸_" /> + <ngram occurrences="16" value="õà" /> + <ngram occurrences="16" value="ôõ" /> + <ngram occurrences="16" value="ôæ" /> + <ngram occurrences="16" value="í_" /> + <ngram occurrences="16" value="æõ" /> + <ngram occurrences="16" value="âõ_" /> + <ngram occurrences="16" value="_ô¨_" /> + <ngram occurrences="15" value="½¹" /> + <ngram occurrences="15" value="õæ" /> + <ngram occurrences="15" value="ôõ¸" /> + <ngram occurrences="15" value="í¨" /> + <ngram occurrences="15" value="æô" /> + <ngram occurrences="15" value="åõ" /> + <ngram occurrences="15" value="_¸õ" /> + <ngram occurrences="15" value="_½¹" /> + <ngram occurrences="15" value="_ô_" /> + <ngram occurrences="15" value="_í¨" /> + <ngram occurrences="15" value="_ë" /> + <ngram occurrences="15" value="_å_" /> + <ngram occurrences="15" value="_â_" /> + <ngram occurrences="14" value="¨å" /> + <ngram occurrences="14" value="ùá_" /> + <ngram occurrences="14" value="õå" /> + <ngram occurrences="14" value="ôâ" /> + <ngram occurrences="14" value="ô_¸" /> + <ngram occurrences="14" value="ì_" /> + <ngram occurrences="14" value="éç" /> + <ngram occurrences="14" value="åô" /> + <ngram occurrences="14" value="ß" /> + <ngram occurrences="14" value="_õ_½" /> + <ngram occurrences="14" value="_éç" /> + <ngram occurrences="14" value="_ç_" /> + <ngram occurrences="13" value="ÿõ" /> + <ngram occurrences="13" value="õ_¸" /> + <ngram occurrences="13" value="ð" /> + <ngram occurrences="13" value="ë_" /> + <ngram occurrences="13" value="â_½" /> + <ngram occurrences="13" value="_¸_" /> + <ngram occurrences="13" value="_½ô_" /> + <ngram occurrences="13" value="_ùá" /> + <ngram occurrences="13" value="_ð" /> + <ngram occurrences="13" value="_æ" /> + <ngram occurrences="12" value="ÿô_" /> + <ngram occurrences="12" value="ÿ_õ_" /> + <ngram occurrences="12" value="ùÿ" /> + <ngram occurrences="12" value="öó" /> + <ngram occurrences="12" value="õù" /> + <ngram occurrences="12" value="õ_ù" /> + <ngram occurrences="12" value="õ_õ" /> + <ngram occurrences="12" value="ôæ_" /> + <ngram occurrences="12" value="ô_õ" /> + <ngram occurrences="12" value="çÿ" /> + <ngram occurrences="12" value="çù" /> + <ngram occurrences="12" value="áõ" /> + <ngram occurrences="12" value="áô" /> + <ngram occurrences="12" value="à_õ" /> + <ngram occurrences="12" value="o" /> + <ngram occurrences="11" value="¸õå" /> + <ngram occurrences="11" value="¨ì_" /> + <ngram occurrences="11" value="¨ì" /> + <ngram occurrences="11" value="½ü" /> + <ngram occurrences="11" value="½_õ" /> + <ngram occurrences="11" value="ùâ" /> + <ngram occurrences="11" value="øÿ" /> + <ngram occurrences="11" value="øâ" /> + <ngram occurrences="11" value="õç_" /> + <ngram occurrences="11" value="õá" /> + <ngram occurrences="11" value="éç_" /> + <ngram occurrences="11" value="çâ" /> + <ngram occurrences="11" value="àô" /> + <ngram occurrences="11" value="º_" /> + <ngram occurrences="11" value="i" /> + <ngram occurrences="11" value="_½ü" /> + <ngram occurrences="11" value="_ÿ_" /> + <ngram occurrences="11" value="_éç_" /> + <ngram occurrences="11" value="_çù" /> + <ngram occurrences="11" value="_ä_" /> + <ngram occurrences="10" value="ù¸" /> + <ngram occurrences="10" value="ö_" /> + <ngram occurrences="10" value="õ_ø" /> + <ngram occurrences="10" value="õ_ô" /> + <ngram occurrences="10" value="õ_ç" /> + <ngram occurrences="10" value="ôõ¸_" /> + <ngram occurrences="10" value="éÿ_" /> + <ngram occurrences="10" value="éÿ" /> + <ngram occurrences="10" value="çà" /> + <ngram occurrences="10" value="æô_" /> + <ngram occurrences="10" value="åõ_" /> + <ngram occurrences="10" value="äõ" /> + <ngram occurrences="10" value="â_ø" /> + <ngram occurrences="10" value="ß_" /> + <ngram occurrences="10" value="¹ô" /> + <ngram occurrences="10" value="r" /> + <ngram occurrences="10" value="e" /> + <ngram occurrences="10" value="a" /> + <ngram occurrences="10" value="_ùá_" /> + <ngram occurrences="10" value="_õà" /> + <ngram occurrences="10" value="_éÿ_" /> + <ngram occurrences="10" value="_éÿ" /> + <ngram occurrences="10" value="_çà" /> + <ngram occurrences="9" value="¸ù" /> + <ngram occurrences="9" value="¸ä" /> + <ngram occurrences="9" value="¸_½" /> + <ngram occurrences="9" value="¨_½" /> + <ngram occurrences="9" value="½à_" /> + <ngram occurrences="9" value="ÿ_½" /> + <ngram occurrences="9" value="ùÿ_" /> + <ngram occurrences="9" value="ùä" /> + <ngram occurrences="9" value="ù_½" /> + <ngram occurrences="9" value="öó_" /> + <ngram occurrences="9" value="ôá" /> + <ngram occurrences="9" value="î_" /> + <ngram occurrences="9" value="ê" /> + <ngram occurrences="9" value="çÿ_" /> + <ngram occurrences="9" value="ç_þ" /> + <ngram occurrences="9" value="ã_" /> + <ngram occurrences="9" value="âù" /> + <ngram occurrences="9" value="ââ" /> + <ngram occurrences="9" value="¹â" /> + <ngram occurrences="9" value="_¸ª_" /> + <ngram occurrences="9" value="_¸ª" /> + <ngram occurrences="9" value="_õç" /> + <ngram occurrences="9" value="_õæ" /> + <ngram occurrences="9" value="_ô¸_" /> + <ngram occurrences="9" value="_ô¸" /> + <ngram occurrences="9" value="_î_" /> + <ngram occurrences="9" value="_âô" /> + <ngram occurrences="9" value="_ß" /> + <ngram occurrences="9" value="_¹_" /> + <ngram occurrences="8" value="¸ë_" /> + <ngram occurrences="8" value="¸ë" /> + <ngram occurrences="8" value="¸_ç" /> + <ngram occurrences="8" value="¨æ" /> + <ngram occurrences="8" value="¨_ç" /> + <ngram occurrences="8" value="½ü_" /> + <ngram occurrences="8" value="½õ_" /> + <ngram occurrences="8" value="½¹_" /> + <ngram occurrences="8" value="ÿõ_" /> + <ngram occurrences="8" value="ÿôæ" /> + <ngram occurrences="8" value="ÿ_ÿ" /> + <ngram occurrences="8" value="ý¹" /> + <ngram occurrences="8" value="ø¸" /> + <ngram occurrences="8" value="õø" /> + <ngram occurrences="8" value="õæõ" /> + <ngram occurrences="8" value="õ_õ_" /> + <ngram occurrences="8" value="õ_é" /> + <ngram occurrences="8" value="õ_â" /> + <ngram occurrences="8" value="ôÿ" /> + <ngram occurrences="8" value="ðç" /> + <ngram occurrences="8" value="í¨ì_" /> + <ngram occurrences="8" value="í¨ì" /> + <ngram occurrences="8" value="éÿ_õ_" /> + <ngram occurrences="8" value="éÿ_õ" /> + <ngram occurrences="8" value="è_" /> + <ngram occurrences="8" value="ç_¸" /> + <ngram occurrences="8" value="ç_þ_" /> + <ngram occurrences="8" value="ç_õ" /> + <ngram occurrences="8" value="æõ_" /> + <ngram occurrences="8" value="âÿ" /> + <ngram occurrences="8" value="áô_" /> + <ngram occurrences="8" value="ºõ" /> + <ngram occurrences="8" value="ªä" /> + <ngram occurrences="8" value="n" /> + <ngram occurrences="8" value="_¸õå" /> + <ngram occurrences="8" value="_½ü_" /> + <ngram occurrences="8" value="_½¹_" /> + <ngram occurrences="8" value="_ü" /> + <ngram occurrences="8" value="_ù_" /> + <ngram occurrences="8" value="_ø¸" /> + <ngram occurrences="8" value="_øâ" /> + <ngram occurrences="8" value="_ö" /> + <ngram occurrences="8" value="_ðç" /> + <ngram occurrences="8" value="_í¨ì_" /> + <ngram occurrences="8" value="_í¨ì" /> + <ngram occurrences="8" value="_í_" /> + <ngram occurrences="8" value="_éÿ_õ" /> + <ngram occurrences="8" value="_áô" /> + <ngram occurrences="7" value="¸ùä" /> + <ngram occurrences="7" value="¸õ¨" /> + <ngram occurrences="7" value="¸ô_" /> + <ngram occurrences="7" value="¸äõ" /> + <ngram occurrences="7" value="¸_é" /> + <ngram occurrences="7" value="½õù" /> + <ngram occurrences="7" value="½ôà" /> + <ngram occurrences="7" value="½_å" /> + <ngram occurrences="7" value="ÿâ" /> + <ngram occurrences="7" value="ùå" /> + <ngram occurrences="7" value="ùä_" /> + <ngram occurrences="7" value="ùâ_" /> + <ngram occurrences="7" value="øÿ_" /> + <ngram occurrences="7" value="ø_õ" /> + <ngram occurrences="7" value="õ¸ª_" /> + <ngram occurrences="7" value="õ¸ª" /> + <ngram occurrences="7" value="õ¨_" /> + <ngram occurrences="7" value="õÿ" /> + <ngram occurrences="7" value="õàõ_" /> + <ngram occurrences="7" value="õàõ" /> + <ngram occurrences="7" value="õ_½ô" /> + <ngram occurrences="7" value="ôà_" /> + <ngram occurrences="7" value="ô_ù" /> + <ngram occurrences="7" value="ðç_" /> + <ngram occurrences="7" value="èý" /> + <ngram occurrences="7" value="çâ_" /> + <ngram occurrences="7" value="æ_½" /> + <ngram occurrences="7" value="å¨" /> + <ngram occurrences="7" value="åâ_" /> + <ngram occurrences="7" value="åâ" /> + <ngram occurrences="7" value="äõ_" /> + <ngram occurrences="7" value="â_¸" /> + <ngram occurrences="7" value="_½õù" /> + <ngram occurrences="7" value="_½õ_" /> + <ngram occurrences="7" value="_ÿõ" /> + <ngram occurrences="7" value="_ÿô_" /> + <ngram occurrences="7" value="_ø_" /> + <ngram occurrences="7" value="_õ¨" /> + <ngram occurrences="7" value="_õç_" /> + <ngram occurrences="7" value="_õæõ" /> + <ngram occurrences="7" value="_õàõ_" /> + <ngram occurrences="7" value="_õàõ" /> + <ngram occurrences="7" value="_ðç_" /> + <ngram occurrences="7" value="_èý" /> + <ngram occurrences="7" value="_çÿ_" /> + <ngram occurrences="7" value="_çÿ" /> + <ngram occurrences="7" value="_çâ" /> + <ngram occurrences="7" value="_åõ_" /> + <ngram occurrences="7" value="_åõ" /> + <ngram occurrences="7" value="_áô_" /> + <ngram occurrences="7" value="_á_" /> + <ngram occurrences="6" value="¸ùä_" /> + <ngram occurrences="6" value="¸õ¨åæ" /> + <ngram occurrences="6" value="¸õ¨å" /> + <ngram occurrences="6" value="¨åæ_" /> + <ngram occurrences="6" value="¨åæ" /> + <ngram occurrences="6" value="½ôâ" /> + <ngram occurrences="6" value="½àõ" /> + <ngram occurrences="6" value="½¹õ¸" /> + <ngram occurrences="6" value="½¹õ" /> + <ngram occurrences="6" value="ÿö" /> + <ngram occurrences="6" value="ÿôæ_" /> + <ngram occurrences="6" value="ÿô_õ" /> + <ngram occurrences="6" value="ÿâ_" /> + <ngram occurrences="6" value="ÿ_ô" /> + <ngram occurrences="6" value="ù¸_" /> + <ngram occurrences="6" value="ùà_" /> + <ngram occurrences="6" value="ùà" /> + <ngram occurrences="6" value="ø½_" /> + <ngram occurrences="6" value="õ¸õ" /> + <ngram occurrences="6" value="õ¨åæ_" /> + <ngram occurrences="6" value="õ¨åæ" /> + <ngram occurrences="6" value="õ¨å" /> + <ngram occurrences="6" value="õâ" /> + <ngram occurrences="6" value="õáõ" /> + <ngram occurrences="6" value="ô½" /> + <ngram occurrences="6" value="ôÿ_" /> + <ngram occurrences="6" value="ôù" /> + <ngram occurrences="6" value="ôã" /> + <ngram occurrences="6" value="ôâ_" /> + <ngram occurrences="6" value="ô_ø" /> + <ngram occurrences="6" value="èý¹" /> + <ngram occurrences="6" value="çùÿ" /> + <ngram occurrences="6" value="ç_½" /> + <ngram occurrences="6" value="ç_õ_" /> + <ngram occurrences="6" value="åô_" /> + <ngram occurrences="6" value="åæ_" /> + <ngram occurrences="6" value="åæ" /> + <ngram occurrences="6" value="å_õ" /> + <ngram occurrences="6" value="âÿ_" /> + <ngram occurrences="6" value="âô_" /> + <ngram occurrences="6" value="âà" /> + <ngram occurrences="6" value="â_ô" /> + <ngram occurrences="6" value="áõ_" /> + <ngram occurrences="6" value="à¸" /> + <ngram occurrences="6" value="à_½" /> + <ngram occurrences="6" value="à_â" /> + <ngram occurrences="6" value="¹õ¸" /> + <ngram occurrences="6" value="¹õ" /> + <ngram occurrences="6" value="t" /> + <ngram occurrences="6" value="f" /> + <ngram occurrences="6" value="d" /> + <ngram occurrences="6" value="c" /> + <ngram occurrences="6" value="_¸_½" /> + <ngram occurrences="6" value="_½àõ" /> + <ngram occurrences="6" value="_½à_" /> + <ngram occurrences="6" value="_½¹õ¸" /> + <ngram occurrences="6" value="_½¹õ" /> + <ngram occurrences="6" value="_ÿö" /> + <ngram occurrences="6" value="_ÿôæ" /> + <ngram occurrences="6" value="_ö_" /> +</ngrams> diff --git a/src/plugins/language/thai.klp b/src/plugins/language/thai.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="890" value="_" /> + <ngram occurrences="343" value="ò" /> + <ngram occurrences="343" value="ã" /> + <ngram occurrences="243" value="¹" /> + <ngram occurrences="223" value="á" /> + <ngram occurrences="204" value="í" /> + <ngram occurrences="204" value="è" /> + <ngram occurrences="173" value="é" /> + <ngram occurrences="172" value="ç" /> + <ngram occurrences="165" value="à" /> + <ngram occurrences="159" value="â" /> + <ngram occurrences="151" value="ñ" /> + <ngram occurrences="117" value="¸" /> + <ngram occurrences="111" value="õ" /> + <ngram occurrences="111" value="å" /> + <ngram occurrences="107" value="_ã" /> + <ngram occurrences="106" value="µ" /> + <ngram occurrences="95" value="ð" /> + <ngram occurrences="95" value="í_" /> + <ngram occurrences="94" value="ò_" /> + <ngram occurrences="89" value="ê" /> + <ngram occurrences="84" value="ô" /> + <ngram occurrences="84" value="_í" /> + <ngram occurrences="78" value="º" /> + <ngram occurrences="76" value="ä" /> + <ngram occurrences="75" value="ë" /> + <ngram occurrences="75" value="_ò" /> + <ngram occurrences="71" value="òã" /> + <ngram occurrences="67" value="¨" /> + <ngram occurrences="63" value="à_" /> + <ngram occurrences="62" value="¹_" /> + <ngram occurrences="59" value="ñ_" /> + <ngram occurrences="54" value="ÿ" /> + <ngram occurrences="54" value="â_" /> + <ngram occurrences="54" value="_òã" /> + <ngram occurrences="53" value="á_" /> + <ngram occurrences="53" value="ª" /> + <ngram occurrences="53" value="_à" /> + <ngram occurrences="52" value="_á" /> + <ngram occurrences="51" value="ã_" /> + <ngram occurrences="51" value="_ç" /> + <ngram occurrences="49" value="òâ" /> + <ngram occurrences="48" value="èò" /> + <ngram occurrences="48" value="_é" /> + <ngram occurrences="45" value="_í_" /> + <ngram occurrences="43" value="_õ" /> + <ngram occurrences="39" value="õè" /> + <ngram occurrences="39" value="è_" /> + <ngram occurrences="37" value="ø" /> + <ngram occurrences="36" value="ãð" /> + <ngram occurrences="36" value="_õè" /> + <ngram occurrences="36" value="_¹" /> + <ngram occurrences="34" value="ì" /> + <ngram occurrences="34" value="éò" /> + <ngram occurrences="33" value="ù" /> + <ngram occurrences="33" value="¹ò" /> + <ngram occurrences="33" value="_ãð" /> + <ngram occurrences="32" value="å_" /> + <ngram occurrences="31" value="éí" /> + <ngram occurrences="31" value="_è" /> + <ngram occurrences="30" value="_ñ" /> + <ngram occurrences="29" value="ãñ" /> + <ngram occurrences="29" value="³" /> + <ngram occurrences="28" value="ó" /> + <ngram occurrences="28" value="ç¹" /> + <ngram occurrences="28" value="ãò" /> + <ngram occurrences="26" value="òâ_" /> + <ngram occurrences="26" value="èò_" /> + <ngram occurrences="26" value="ãã" /> + <ngram occurrences="26" value="_å" /> + <ngram occurrences="26" value="_ä" /> + <ngram occurrences="25" value="ì_" /> + <ngram occurrences="25" value="é_" /> + <ngram occurrences="24" value="¸é" /> + <ngram occurrences="24" value="çè" /> + <ngram occurrences="24" value="ç_" /> + <ngram occurrences="24" value="º_" /> + <ngram occurrences="23" value="õ_" /> + <ngram occurrences="23" value="ñº" /> + <ngram occurrences="23" value="ð_" /> + <ngram occurrences="23" value="çèò" /> + <ngram occurrences="23" value="_éò" /> + <ngram occurrences="23" value="_º" /> + <ngram occurrences="22" value="_¨" /> + <ngram occurrences="21" value="¸_" /> + <ngram occurrences="21" value="½" /> + <ngram occurrences="21" value="òá" /> + <ngram occurrences="21" value="éí_" /> + <ngram occurrences="21" value="èí" /> + <ngram occurrences="21" value="ä_" /> + <ngram occurrences="21" value="ã¹" /> + <ngram occurrences="21" value="_ê" /> + <ngram occurrences="20" value="ô_" /> + <ngram occurrences="20" value="òã_" /> + <ngram occurrences="20" value="ò¹" /> + <ngram occurrences="20" value="éç" /> + <ngram occurrences="20" value="áè" /> + <ngram occurrences="20" value="_â" /> + <ngram occurrences="19" value="äá" /> + <ngram occurrences="19" value="áå" /> + <ngram occurrences="19" value="µã" /> + <ngram occurrences="19" value="_à_" /> + <ngram occurrences="18" value="èç" /> + <ngram occurrences="18" value="äáè" /> + <ngram occurrences="18" value="ãñ_" /> + <ngram occurrences="18" value="µè" /> + <ngram occurrences="18" value="_ÿ" /> + <ngram occurrences="18" value="_ãñ" /> + <ngram occurrences="17" value="¨ð" /> + <ngram occurrences="17" value="ëò" /> + <ngram occurrences="17" value="çò" /> + <ngram occurrences="17" value="çá" /> + <ngram occurrences="17" value="ä¸é" /> + <ngram occurrences="17" value="ä¸" /> + <ngram occurrences="16" value="òµ" /> + <ngram occurrences="16" value="çèò_" /> + <ngram occurrences="16" value="ãòâ" /> + <ngram occurrences="16" value="ãá" /> + <ngram occurrences="16" value="áõ" /> + <ngram occurrences="16" value="áò" /> + <ngram occurrences="16" value="¹òâ" /> + <ngram occurrences="16" value="ªò" /> + <ngram occurrences="16" value="_ô" /> + <ngram occurrences="16" value="_ë" /> + <ngram occurrences="16" value="_ª" /> + <ngram occurrences="15" value="ö" /> + <ngram occurrences="15" value="ò_ã" /> + <ngram occurrences="15" value="åð" /> + <ngram occurrences="15" value="ãà" /> + <ngram occurrences="15" value="_òã_" /> + <ngram occurrences="15" value="_éí" /> + <ngram occurrences="15" value="_ãñ_" /> + <ngram occurrences="15" value="_µ" /> + <ngram occurrences="14" value="ù_" /> + <ngram occurrences="14" value="ò_ò" /> + <ngram occurrences="14" value="ñé" /> + <ngram occurrences="14" value="ðà" /> + <ngram occurrences="14" value="íâ" /> + <ngram occurrences="14" value="é¹" /> + <ngram occurrences="14" value="ãë" /> + <ngram occurrences="14" value="â_ã" /> + <ngram occurrences="14" value="á_í" /> + <ngram occurrences="14" value="à_ç" /> + <ngram occurrences="14" value="µô" /> + <ngram occurrences="13" value="òãà" /> + <ngram occurrences="13" value="ò_òã" /> + <ngram occurrences="13" value="ñ¹" /> + <ngram occurrences="13" value="íá" /> + <ngram occurrences="13" value="í_ã" /> + <ngram occurrences="13" value="è¹" /> + <ngram occurrences="13" value="à_ç¹" /> + <ngram occurrences="13" value="¹à" /> + <ngram occurrences="13" value="_òãà" /> + <ngram occurrences="13" value="_ç¹" /> + <ngram occurrences="12" value="ÿã" /> + <ngram occurrences="12" value="ö_" /> + <ngram occurrences="12" value="ñ¸" /> + <ngram occurrences="12" value="ñ_á" /> + <ngram occurrences="12" value="í¹" /> + <ngram occurrences="12" value="ëé" /> + <ngram occurrences="12" value="ë¹" /> + <ngram occurrences="12" value="éá" /> + <ngram occurrences="12" value="è_ã" /> + <ngram occurrences="12" value="çòá" /> + <ngram occurrences="12" value="ç¹_" /> + <ngram occurrences="12" value="ãëé" /> + <ngram occurrences="12" value="âñ" /> + <ngram occurrences="12" value="áåð" /> + <ngram occurrences="12" value="á¹" /> + <ngram occurrences="12" value="áµ" /> + <ngram occurrences="12" value="àò" /> + <ngram occurrences="12" value="ºò" /> + <ngram occurrences="12" value="¹ñ" /> + <ngram occurrences="12" value="µé" /> + <ngram occurrences="12" value="_¸" /> + <ngram occurrences="12" value="_èí" /> + <ngram occurrences="12" value="_çòá" /> + <ngram occurrences="12" value="_çò" /> + <ngram occurrences="12" value="_¹ò" /> + <ngram occurrences="11" value="¸ã" /> + <ngram occurrences="11" value="õé" /> + <ngram occurrences="11" value="õè_" /> + <ngram occurrences="11" value="õâ" /> + <ngram occurrences="11" value="ô¹" /> + <ngram occurrences="11" value="íã" /> + <ngram occurrences="11" value="êà" /> + <ngram occurrences="11" value="ê_" /> + <ngram occurrences="11" value="éò_" /> + <ngram occurrences="11" value="çâ" /> + <ngram occurrences="11" value="åñ" /> + <ngram occurrences="11" value="áà" /> + <ngram occurrences="11" value="àë" /> + <ngram occurrences="11" value="àá" /> + <ngram occurrences="11" value="¹õé" /> + <ngram occurrences="11" value="¹õ" /> + <ngram occurrences="11" value="¹ò_" /> + <ngram occurrences="11" value="¹ç" /> + <ngram occurrences="11" value="µñ" /> + <ngram occurrences="11" value="_õè_" /> + <ngram occurrences="11" value="_ãò" /> + <ngram occurrences="10" value="ø_" /> + <ngram occurrences="10" value="ô¸" /> + <ngram occurrences="10" value="êè" /> + <ngram occurrences="10" value="èá" /> + <ngram occurrences="10" value="åé" /> + <ngram occurrences="10" value="åè" /> + <ngram occurrences="10" value="å_í" /> + <ngram occurrences="10" value="ã¨" /> + <ngram occurrences="10" value="ãðà" /> + <ngram occurrences="10" value="ãí" /> + <ngram occurrences="10" value="ãì" /> + <ngram occurrences="10" value="ã_í" /> + <ngram occurrences="10" value="áê" /> + <ngram occurrences="10" value="àá_" /> + <ngram occurrences="10" value="àµ" /> + <ngram occurrences="10" value="à_ô" /> + <ngram occurrences="10" value="¹í" /> + <ngram occurrences="10" value="¹á" /> + <ngram occurrences="10" value="¹µ" /> + <ngram occurrences="10" value="µéí_" /> + <ngram occurrences="10" value="µéí" /> + <ngram occurrences="10" value="³ð" /> + <ngram occurrences="10" value="_ô¸" /> + <ngram occurrences="10" value="_ó" /> + <ngram occurrences="10" value="_ò_" /> + <ngram occurrences="10" value="_éí_" /> + <ngram occurrences="10" value="_ãòâ" /> + <ngram occurrences="10" value="_ãðà" /> + <ngram occurrences="9" value="¸ô" /> + <ngram occurrences="9" value="¨ò" /> + <ngram occurrences="9" value="ÿå" /> + <ngram occurrences="9" value="íà" /> + <ngram occurrences="9" value="í_í" /> + <ngram occurrences="9" value="ëòã" /> + <ngram occurrences="9" value="éò¹" /> + <ngram occurrences="9" value="ãô" /> + <ngram occurrences="9" value="ãñº" /> + <ngram occurrences="9" value="ããá" /> + <ngram occurrences="9" value="â¸" /> + <ngram occurrences="9" value="âñ_" /> + <ngram occurrences="9" value="áµè" /> + <ngram occurrences="9" value="á_í_" /> + <ngram occurrences="9" value="à_é" /> + <ngram occurrences="9" value="ºã" /> + <ngram occurrences="9" value="_ñº" /> + <ngram occurrences="9" value="_ñ_" /> + <ngram occurrences="9" value="_áåð" /> + <ngram occurrences="9" value="_áå" /> + <ngram occurrences="9" value="_áµ" /> + <ngram occurrences="9" value="_á_" /> + <ngram occurrences="9" value="_ºò" /> + <ngram occurrences="8" value="¸õ" /> + <ngram occurrences="8" value="¨ò_" /> + <ngram occurrences="8" value="¨ñ" /> + <ngram occurrences="8" value="òê" /> + <ngram occurrences="8" value="òå" /> + <ngram occurrences="8" value="ò¹_" /> + <ngram occurrences="8" value="òµô" /> + <ngram occurrences="8" value="ñ¸_" /> + <ngram occurrences="8" value="ñé¹" /> + <ngram occurrences="8" value="ñº_" /> + <ngram occurrences="8" value="ðä" /> + <ngram occurrences="8" value="ðà_" /> + <ngram occurrences="8" value="íº" /> + <ngram occurrences="8" value="ëç" /> + <ngram occurrences="8" value="èí_" /> + <ngram occurrences="8" value="èä" /> + <ngram occurrences="8" value="çñ" /> + <ngram occurrences="8" value="çé" /> + <ngram occurrences="8" value="å_í_" /> + <ngram occurrences="8" value="å_ã" /> + <ngram occurrences="8" value="ãõ" /> + <ngram occurrences="8" value="ãé" /> + <ngram occurrences="8" value="ãç" /> + <ngram occurrences="8" value="ãã_" /> + <ngram occurrences="8" value="ãá_" /> + <ngram occurrences="8" value="âí" /> + <ngram occurrences="8" value="âç" /> + <ngram occurrences="8" value="áë" /> + <ngram occurrences="8" value="à¸" /> + <ngram occurrences="8" value="¹òâ_" /> + <ngram occurrences="8" value="¹_ò" /> + <ngram occurrences="8" value="¹_í" /> + <ngram occurrences="8" value="ªòµô" /> + <ngram occurrences="8" value="ªòµ" /> + <ngram occurrences="8" value="_ø" /> + <ngram occurrences="8" value="_ëò" /> + <ngram occurrences="8" value="_éò_" /> + <ngram occurrences="8" value="_áµè" /> + <ngram occurrences="8" value="_¹òâ" /> + <ngram occurrences="8" value="_³ð" /> + <ngram occurrences="8" value="_³" /> + <ngram occurrences="7" value="¸éç" /> + <ngram occurrences="7" value="¸â" /> + <ngram occurrences="7" value="½ù" /> + <ngram occurrences="7" value="ÿô" /> + <ngram occurrences="7" value="ÿñ" /> + <ngram occurrences="7" value="ÿå_" /> + <ngram occurrences="7" value="ÿãã_" /> + <ngram occurrences="7" value="ÿãã" /> + <ngram occurrences="7" value="ùé" /> + <ngram occurrences="7" value="õé_" /> + <ngram occurrences="7" value="ò¸" /> + <ngram occurrences="7" value="ñé¹_" /> + <ngram occurrences="7" value="ñ_ºòå" /> + <ngram occurrences="7" value="ñ_ºò" /> + <ngram occurrences="7" value="ñ_º" /> + <ngram occurrences="7" value="ðà_è" /> + <ngram occurrences="7" value="íí" /> + <ngram occurrences="7" value="í¹_" /> + <ngram occurrences="7" value="í_ñ" /> + <ngram occurrences="7" value="í_ª" /> + <ngram occurrences="7" value="ëå" /> + <ngram occurrences="7" value="éà" /> + <ngram occurrences="7" value="é¹_" /> + <ngram occurrences="7" value="èç¹" /> + <ngram occurrences="7" value="èâ" /> + <ngram occurrences="7" value="è_ãð" /> + <ngram occurrences="7" value="åñ_" /> + <ngram occurrences="7" value="äçé" /> + <ngram occurrences="7" value="äç" /> + <ngram occurrences="7" value="ãø" /> + <ngram occurrences="7" value="ãõ_" /> + <ngram occurrences="7" value="ãòâ_" /> + <ngram occurrences="7" value="ãñ_ºò" /> + <ngram occurrences="7" value="ãñ_º" /> + <ngram occurrences="7" value="ãðà_è" /> + <ngram occurrences="7" value="ãðà_" /> + <ngram occurrences="7" value="ãð_" /> + <ngram occurrences="7" value="ãì_" /> + <ngram occurrences="7" value="ãè" /> + <ngram occurrences="7" value="ã¹_" /> + <ngram occurrences="7" value="ã_ã" /> + <ngram occurrences="7" value="â¸â" /> + <ngram occurrences="7" value="âì" /> + <ngram occurrences="7" value="âã" /> + <ngram occurrences="7" value="âá" /> + <ngram occurrences="7" value="áÿ" /> + <ngram occurrences="7" value="áåé" /> + <ngram occurrences="7" value="áã" /> + <ngram occurrences="7" value="à_ô¸" /> + <ngram occurrences="7" value="à_éò" /> + <ngram occurrences="7" value="à_è" /> + <ngram occurrences="7" value="ºòå" /> + <ngram occurrences="7" value="¹õé_" /> + <ngram occurrences="7" value="¹ñé¹" /> + <ngram occurrences="7" value="¹ñé" /> + <ngram occurrences="7" value="¹ê" /> + <ngram occurrences="7" value="¹é" /> + <ngram occurrences="7" value="¹µã" /> + <ngram occurrences="7" value="¹_òã" /> + <ngram occurrences="7" value="µ_" /> + <ngram occurrences="7" value="_¨ð" /> + <ngram occurrences="7" value="_ÿå" /> + <ngram occurrences="7" value="_í_ã" /> + <ngram occurrences="7" value="_í_ª" /> + <ngram occurrences="7" value="_ê_" /> + <ngram occurrences="7" value="_äáè" /> + <ngram occurrences="7" value="_äá" /> + <ngram occurrences="7" value="_ãðà_" /> + <ngram occurrences="7" value="_á¹" /> + <ngram occurrences="7" value="_ºòå" /> + <ngram occurrences="7" value="_º_" /> + <ngram occurrences="6" value="¸ããá" /> + <ngram occurrences="6" value="¸ãã" /> + <ngram occurrences="6" value="¸à" /> + <ngram occurrences="6" value="¸_éí" /> + <ngram occurrences="6" value="¸_é" /> + <ngram occurrences="6" value="¨ñ¸" /> + <ngram occurrences="6" value="¨_" /> + <ngram occurrences="6" value="½ùé" /> + <ngram occurrences="6" value="½è" /> + <ngram occurrences="6" value="ÿò" /> + <ngram occurrences="6" value="ÿå_í_" /> + <ngram occurrences="6" value="ÿå_í" /> + <ngram occurrences="6" value="õèâ" /> + <ngram occurrences="6" value="ôë" /> + <ngram occurrences="6" value="ôª" /> + <ngram occurrences="6" value="ó¹" /> + <ngram occurrences="6" value="ò¨" /> + <ngram occurrences="6" value="òð" /> + <ngram occurrences="6" value="òç" /> + <ngram occurrences="6" value="òãàá_" /> + <ngram occurrences="6" value="òãàá" /> + <ngram occurrences="6" value="òá_" /> + <ngram occurrences="6" value="òà" /> + <ngram occurrences="6" value="ò³" /> + <ngram occurrences="6" value="òª" /> + <ngram occurrences="6" value="ò_òãà" /> + <ngram occurrences="6" value="ò_ç" /> + <ngram occurrences="6" value="ñé_" /> + <ngram occurrences="6" value="ñâ" /> + <ngram occurrences="6" value="ñ²¹" /> + <ngram occurrences="6" value="ñ²" /> + <ngram occurrences="6" value="ñ_ëò" /> + <ngram occurrences="6" value="ñ_ë" /> + <ngram occurrences="6" value="ñ_á¹µ" /> + <ngram occurrences="6" value="ñ_á¹" /> + <ngram occurrences="6" value="ðê" /> + <ngram occurrences="6" value="ðâ" /> +</ngrams> diff --git a/src/plugins/language/turkish.klp b/src/plugins/language/turkish.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="975" value="_" /> + <ngram occurrences="470" value="i" /> + <ngram occurrences="439" value="a" /> + <ngram occurrences="316" value="e" /> + <ngram occurrences="276" value="n" /> + <ngram occurrences="249" value="i_" /> + <ngram occurrences="244" value="l" /> + <ngram occurrences="239" value="r" /> + <ngram occurrences="218" value="_i" /> + <ngram occurrences="181" value="_i_" /> + <ngram occurrences="175" value="k" /> + <ngram occurrences="172" value="s" /> + <ngram occurrences="148" value="d" /> + <ngram occurrences="128" value="n_" /> + <ngram occurrences="119" value="t" /> + <ngram occurrences="113" value="y" /> + <ngram occurrences="110" value="m" /> + <ngram occurrences="105" value="u" /> + <ngram occurrences="98" value="a_" /> + <ngram occurrences="97" value="o" /> + <ngram occurrences="93" value="_s" /> + <ngram occurrences="90" value="b" /> + <ngram occurrences="87" value="s_" /> + <ngram occurrences="81" value="e_" /> + <ngram occurrences="75" value="ar" /> + <ngram occurrences="73" value="la" /> + <ngram occurrences="73" value="g" /> + <ngram occurrences="70" value="_b" /> + <ngram occurrences="66" value="an" /> + <ngram occurrences="65" value="ü" /> + <ngram occurrences="64" value="_s_" /> + <ngram occurrences="62" value="_g" /> + <ngram occurrences="60" value="_k" /> + <ngram occurrences="59" value="in" /> + <ngram occurrences="58" value="r_" /> + <ngram occurrences="56" value="k_" /> + <ngram occurrences="54" value="ra" /> + <ngram occurrences="53" value="_n" /> + <ngram occurrences="52" value="le" /> + <ngram occurrences="50" value="i_n" /> + <ngram occurrences="50" value="_y" /> + <ngram occurrences="49" value="il" /> + <ngram occurrences="49" value="_i_n" /> + <ngram occurrences="48" value="er" /> + <ngram occurrences="48" value="da" /> + <ngram occurrences="45" value="_a" /> + <ngram occurrences="44" value="z" /> + <ngram occurrences="43" value="_d" /> + <ngram occurrences="42" value="i_s" /> + <ngram occurrences="40" value="en" /> + <ngram occurrences="40" value="de" /> + <ngram occurrences="39" value="s_i" /> + <ngram occurrences="39" value="p" /> + <ngram occurrences="39" value="nd" /> + <ngram occurrences="39" value="_t" /> + <ngram occurrences="38" value="_l" /> + <ngram occurrences="37" value="lar" /> + <ngram occurrences="37" value="l_" /> + <ngram occurrences="36" value="i_s_" /> + <ngram occurrences="34" value="ya" /> + <ngram occurrences="34" value="ri" /> + <ngram occurrences="34" value="ka" /> + <ngram occurrences="33" value="v" /> + <ngram occurrences="33" value="g_" /> + <ngram occurrences="33" value="c" /> + <ngram occurrences="32" value="u_" /> + <ngram occurrences="32" value="s_i_" /> + <ngram occurrences="31" value="in_" /> + <ngram occurrences="30" value="ç" /> + <ngram occurrences="30" value="ma" /> + <ngram occurrences="30" value="bi" /> + <ngram occurrences="30" value="an_" /> + <ngram occurrences="30" value="ak" /> + <ngram occurrences="30" value="_i_s" /> + <ngram occurrences="30" value="_g_" /> + <ngram occurrences="29" value="ol" /> + <ngram occurrences="29" value="ara" /> + <ngram occurrences="29" value="ar_" /> + <ngram occurrences="28" value="ler" /> + <ngram occurrences="28" value="ki" /> + <ngram occurrences="28" value="i_n_" /> + <ngram occurrences="28" value="_o" /> + <ngram occurrences="28" value="_n_" /> + <ngram occurrences="28" value="_i_n_" /> + <ngram occurrences="27" value="re" /> + <ngram occurrences="27" value="h" /> + <ngram occurrences="27" value="eri" /> + <ngram occurrences="27" value="_i_s_" /> + <ngram occurrences="26" value="si" /> + <ngram occurrences="26" value="ir" /> + <ngram occurrences="26" value="ek" /> + <ngram occurrences="26" value="da_" /> + <ngram occurrences="24" value="li" /> + <ngram occurrences="24" value="_m" /> + <ngram occurrences="24" value="_ka" /> + <ngram occurrences="23" value="ni" /> + <ngram occurrences="23" value="me" /> + <ngram occurrences="23" value="ba" /> + <ngram occurrences="22" value="te" /> + <ngram occurrences="22" value="on" /> + <ngram occurrences="22" value="nda" /> + <ngram occurrences="22" value="n_i" /> + <ngram occurrences="22" value="leri" /> + <ngram occurrences="22" value="g_i" /> + <ngram occurrences="22" value="di" /> + <ngram occurrences="22" value="_s_i" /> + <ngram occurrences="22" value="_bi" /> + <ngram occurrences="21" value="ö" /> + <ngram occurrences="21" value="ve" /> + <ngram occurrences="21" value="f" /> + <ngram occurrences="21" value="en_" /> + <ngram occurrences="21" value="al" /> + <ngram occurrences="21" value="_v" /> + <ngram occurrences="20" value="un" /> + <ngram occurrences="20" value="t_" /> + <ngram occurrences="20" value="n_i_" /> + <ngram occurrences="20" value="lar_" /> + <ngram occurrences="20" value="g_i_" /> + <ngram occurrences="20" value="et" /> + <ngram occurrences="20" value="ay" /> + <ngram occurrences="20" value="at" /> + <ngram occurrences="20" value="_r" /> + <ngram occurrences="19" value="r_i" /> + <ngram occurrences="19" value="l_i" /> + <ngram occurrences="19" value="ile" /> + <ngram occurrences="19" value="i_g" /> + <ngram occurrences="19" value="d_" /> + <ngram occurrences="19" value="bu" /> + <ngram occurrences="19" value="a_g" /> + <ngram occurrences="19" value="_ya" /> + <ngram occurrences="19" value="_ol" /> + <ngram occurrences="19" value="_g_i" /> + <ngram occurrences="19" value="_e" /> + <ngram occurrences="19" value="_ba" /> + <ngram occurrences="18" value="r_i_" /> + <ngram occurrences="18" value="l_i_" /> + <ngram occurrences="18" value="i_nd" /> + <ngram occurrences="18" value="i_l" /> + <ngram occurrences="18" value="es" /> + <ngram occurrences="18" value="de_" /> + <ngram occurrences="18" value="d_i_" /> + <ngram occurrences="18" value="d_i" /> + <ngram occurrences="18" value="_ve" /> + <ngram occurrences="18" value="_nd" /> + <ngram occurrences="18" value="_i_nd" /> + <ngram occurrences="18" value="_i_l" /> + <ngram occurrences="17" value="nu" /> + <ngram occurrences="17" value="mi" /> + <ngram occurrences="17" value="_p" /> + <ngram occurrences="17" value="_g_i_" /> + <ngram occurrences="16" value="ye" /> + <ngram occurrences="16" value="y_" /> + <ngram occurrences="16" value="se" /> + <ngram occurrences="16" value="pa" /> + <ngram occurrences="16" value="or" /> + <ngram occurrences="16" value="ola" /> + <ngram occurrences="16" value="ki_" /> + <ngram occurrences="16" value="is" /> + <ngram occurrences="16" value="i_nda" /> + <ngram occurrences="16" value="_ü" /> + <ngram occurrences="16" value="_nda" /> + <ngram occurrences="16" value="_bu" /> + <ngram occurrences="15" value="ve_" /> + <ngram occurrences="15" value="ta" /> + <ngram occurrences="15" value="t_i" /> + <ngram occurrences="15" value="nl" /> + <ngram occurrences="15" value="na" /> + <ngram occurrences="15" value="n_y" /> + <ngram occurrences="15" value="ke" /> + <ngram occurrences="15" value="ge" /> + <ngram occurrences="15" value="el" /> + <ngram occurrences="15" value="ed" /> + <ngram occurrences="15" value="az" /> + <ngram occurrences="15" value="as" /> + <ngram occurrences="15" value="ar_i_" /> + <ngram occurrences="15" value="ar_i" /> + <ngram occurrences="15" value="am" /> + <ngram occurrences="15" value="ak_" /> + <ngram occurrences="15" value="a_s" /> + <ngram occurrences="15" value="_ve_" /> + <ngram occurrences="15" value="_s_i_" /> + <ngram occurrences="14" value="rl" /> + <ngram occurrences="14" value="rin" /> + <ngram occurrences="14" value="ko" /> + <ngram occurrences="14" value="ik" /> + <ngram occurrences="14" value="i_n_i" /> + <ngram occurrences="14" value="i_b" /> + <ngram occurrences="14" value="erin" /> + <ngram occurrences="14" value="as_i_" /> + <ngram occurrences="14" value="as_i" /> + <ngram occurrences="14" value="as_" /> + <ngram occurrences="14" value="a_s_" /> + <ngram occurrences="14" value="_n_i_" /> + <ngram occurrences="14" value="_n_i" /> + <ngram occurrences="14" value="_ge" /> + <ngram occurrences="13" value="z_" /> + <ngram occurrences="13" value="yü" /> + <ngram occurrences="13" value="yo" /> + <ngram occurrences="13" value="t_i_" /> + <ngram occurrences="13" value="sa" /> + <ngram occurrences="13" value="rk" /> + <ngram occurrences="13" value="ra_" /> + <ngram occurrences="13" value="nda_" /> + <ngram occurrences="13" value="m_" /> + <ngram occurrences="13" value="lar_i" /> + <ngram occurrences="13" value="iy" /> + <ngram occurrences="13" value="i_s_i" /> + <ngram occurrences="13" value="i_k" /> + <ngram occurrences="13" value="esi" /> + <ngram occurrences="13" value="em" /> + <ngram occurrences="13" value="dan" /> + <ngram occurrences="13" value="ad" /> + <ngram occurrences="13" value="_ola" /> + <ngram occurrences="13" value="_ko" /> + <ngram occurrences="13" value="_h" /> + <ngram occurrences="12" value="y_i_" /> + <ngram occurrences="12" value="y_i" /> + <ngram occurrences="12" value="ur" /> + <ngram occurrences="12" value="to" /> + <ngram occurrences="12" value="ti" /> + <ngram occurrences="12" value="s_i_n" /> + <ngram occurrences="12" value="ne" /> + <ngram occurrences="12" value="n_b" /> + <ngram occurrences="12" value="lm" /> + <ngram occurrences="12" value="lerin" /> + <ngram occurrences="12" value="ld" /> + <ngram occurrences="12" value="lara" /> + <ngram occurrences="12" value="im" /> + <ngram occurrences="12" value="i_r" /> + <ngram occurrences="12" value="ha" /> + <ngram occurrences="12" value="ap" /> + <ngram occurrences="12" value="anl" /> + <ngram occurrences="12" value="_pa" /> + <ngram occurrences="12" value="_de" /> + <ngram occurrences="11" value="tü" /> + <ngram occurrences="11" value="tl" /> + <ngram occurrences="11" value="rak" /> + <ngram occurrences="11" value="r_i_n" /> + <ngram occurrences="11" value="ir_" /> + <ngram occurrences="11" value="ini" /> + <ngram occurrences="11" value="g_i_n" /> + <ngram occurrences="11" value="ek_" /> + <ngram occurrences="11" value="dan_" /> + <ngram occurrences="11" value="bir" /> + <ngram occurrences="11" value="a_g_" /> + <ngram occurrences="11" value="_i_r" /> + <ngram occurrences="11" value="_da" /> + <ngram occurrences="11" value="_bir" /> + <ngram occurrences="10" value="ür" /> + <ngram occurrences="10" value="ük" /> + <ngram occurrences="10" value="ru" /> + <ngram occurrences="10" value="nin_" /> + <ngram occurrences="10" value="nin" /> + <ngram occurrences="10" value="nde" /> + <ngram occurrences="10" value="n_s" /> + <ngram occurrences="10" value="n_k" /> + <ngram occurrences="10" value="lan" /> + <ngram occurrences="10" value="kan" /> + <ngram occurrences="10" value="k_b" /> + <ngram occurrences="10" value="iz" /> + <ngram occurrences="10" value="i_g_i" /> + <ngram occurrences="10" value="i_g_" /> + <ngram occurrences="10" value="er_" /> + <ngram occurrences="10" value="ce" /> + <ngram occurrences="10" value="bil" /> + <ngram occurrences="10" value="_ç" /> + <ngram occurrences="10" value="_il" /> + <ngram occurrences="10" value="_i_k" /> + <ngram occurrences="10" value="_i_g" /> + <ngram occurrences="10" value="_ar" /> + <ngram occurrences="9" value="za" /> + <ngram occurrences="9" value="ya_" /> + <ngram occurrences="9" value="ul" /> + <ngram occurrences="9" value="su" /> + <ngram occurrences="9" value="sin" /> + <ngram occurrences="9" value="si_" /> + <ngram occurrences="9" value="s_l" /> + <ngram occurrences="9" value="rd" /> + <ngram occurrences="9" value="olar" /> + <ngram occurrences="9" value="li_" /> + <ngram occurrences="9" value="la_" /> + <ngram occurrences="9" value="kon" /> + <ngram occurrences="9" value="iler" /> + <ngram occurrences="9" value="i_y" /> + <ngram occurrences="9" value="i_d" /> + <ngram occurrences="9" value="ec" /> + <ngram occurrences="9" value="e_s" /> + <ngram occurrences="9" value="e_b" /> + <ngram occurrences="9" value="bu_" /> + <ngram occurrences="9" value="bir_" /> + <ngram occurrences="9" value="ba_" /> + <ngram occurrences="9" value="ala" /> + <ngram occurrences="9" value="af" /> + <ngram occurrences="9" value="ada" /> + <ngram occurrences="9" value="_yü" /> + <ngram occurrences="9" value="_te" /> + <ngram occurrences="9" value="_sa" /> + <ngram occurrences="9" value="_s_l" /> + <ngram occurrences="9" value="_la" /> + <ngram occurrences="9" value="_kon" /> + <ngram occurrences="9" value="_ha" /> + <ngram occurrences="9" value="_f" /> + <ngram occurrences="9" value="_bu_" /> + <ngram occurrences="9" value="_bir_" /> + <ngram occurrences="9" value="_ba_" /> + <ngram occurrences="8" value="ü_" /> + <ngram occurrences="8" value="çe" /> + <ngram occurrences="8" value="ye_" /> + <ngram occurrences="8" value="y_i_l" /> + <ngram occurrences="8" value="un_" /> + <ngram occurrences="8" value="um" /> + <ngram occurrences="8" value="rla" /> + <ngram occurrences="8" value="rin_" /> + <ngram occurrences="8" value="ri_" /> + <ngram occurrences="8" value="rak_" /> + <ngram occurrences="8" value="r_b" /> + <ngram occurrences="8" value="onu" /> + <ngram occurrences="8" value="on_" /> + <ngram occurrences="8" value="nla" /> + <ngram occurrences="8" value="lu" /> + <ngram occurrences="8" value="lma" /> + <ngram occurrences="8" value="lk" /> + <ngram occurrences="8" value="leri_" /> + <ngram occurrences="8" value="k_t" /> + <ngram occurrences="8" value="iye" /> + <ngram occurrences="8" value="inin_" /> + <ngram occurrences="8" value="inin" /> + <ngram occurrences="8" value="ind" /> + <ngram occurrences="8" value="i_t" /> + <ngram occurrences="8" value="eç" /> + <ngram occurrences="8" value="esi_" /> + <ngram occurrences="8" value="erin_" /> + <ngram occurrences="8" value="eri_" /> + <ngram occurrences="8" value="eni" /> + <ngram occurrences="8" value="eki" /> + <ngram occurrences="8" value="edi" /> + <ngram occurrences="8" value="ece" /> + <ngram occurrences="8" value="e_i" /> + <ngram occurrences="8" value="di_" /> + <ngram occurrences="8" value="ci" /> + <ngram occurrences="8" value="ba_s_" /> + <ngram occurrences="8" value="ba_s" /> + <ngram occurrences="8" value="arak" /> + <ngram occurrences="8" value="ara_" /> + <ngram occurrences="8" value="ama" /> + <ngram occurrences="8" value="ab" /> + <ngram occurrences="8" value="a_b" /> + <ngram occurrences="8" value="a_a" /> + <ngram occurrences="8" value="_y_i_" /> + <ngram occurrences="8" value="_y_i" /> + <ngram occurrences="8" value="_y_" /> + <ngram occurrences="8" value="_tü" /> + <ngram occurrences="8" value="_ra" /> + <ngram occurrences="8" value="_nda_" /> + <ngram occurrences="8" value="_me" /> + <ngram occurrences="8" value="_li" /> + <ngram occurrences="8" value="_l_" /> + <ngram occurrences="8" value="_k_" /> + <ngram occurrences="8" value="_da_" /> + <ngram occurrences="8" value="_ba_s" /> + <ngram occurrences="7" value="ürk" /> + <ngram occurrences="7" value="ün" /> + <ngram occurrences="7" value="ör" /> + <ngram occurrences="7" value="yan" /> + <ngram occurrences="7" value="unu" /> + <ngram occurrences="7" value="türk" /> + <ngram occurrences="7" value="tür" /> + <ngram occurrences="7" value="s_m" /> + <ngram occurrences="7" value="s_i_s" /> + <ngram occurrences="7" value="par" /> + <ngram occurrences="7" value="olara" /> + <ngram occurrences="7" value="ndan_" /> + <ngram occurrences="7" value="ndan" /> + <ngram occurrences="7" value="n_t" /> + <ngram occurrences="7" value="n_li" /> + <ngram occurrences="7" value="n_l" /> + <ngram occurrences="7" value="n_i_n" /> + <ngram occurrences="7" value="n_d" /> + <ngram occurrences="7" value="n_a" /> + <ngram occurrences="7" value="mesi" /> + <ngram occurrences="7" value="mes" /> + <ngram occurrences="7" value="ma_" /> + <ngram occurrences="7" value="lke" /> + <ngram occurrences="7" value="lir" /> + <ngram occurrences="7" value="kanl" /> + <ngram occurrences="7" value="k_k" /> + <ngram occurrences="7" value="inde" /> + <ngram occurrences="7" value="ik_" /> + <ngram occurrences="7" value="i_ve" /> + <ngram occurrences="7" value="i_v" /> + <ngram occurrences="7" value="i_o" /> + <ngram occurrences="7" value="i_k_" /> + <ngram occurrences="7" value="i_i" /> + <ngram occurrences="7" value="i_a" /> + <ngram occurrences="7" value="geç" /> + <ngram occurrences="7" value="e_g" /> + <ngram occurrences="7" value="dil" /> + <ngram occurrences="7" value="cu" /> + <ngram occurrences="7" value="bin_" /> + <ngram occurrences="7" value="bin" /> +</ngrams> diff --git a/src/plugins/language/ukrainian.klp b/src/plugins/language/ukrainian.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="835" value="_" /> + <ngram occurrences="360" value="ï" /> + <ngram occurrences="292" value="á" /> + <ngram occurrences="243" value="é" /> + <ngram occurrences="211" value="¨" /> + <ngram occurrences="191" value="î" /> + <ngram occurrences="169" value="ô" /> + <ngram occurrences="163" value="ò" /> + <ngram occurrences="163" value="ä" /> + <ngram occurrences="153" value="å" /> + <ngram occurrences="136" value="ì" /> + <ngram occurrences="133" value="ë" /> + <ngram occurrences="131" value="ó" /> + <ngram occurrences="124" value="á_" /> + <ngram occurrences="123" value="ð" /> + <ngram occurrences="119" value="õ" /> + <ngram occurrences="114" value="ï_" /> + <ngram occurrences="98" value="é_" /> + <ngram occurrences="92" value="í" /> + <ngram occurrences="91" value="ñ" /> + <ngram occurrences="90" value="_ð" /> + <ngram occurrences="82" value="¨_" /> + <ngram occurrences="79" value="ú" /> + <ngram occurrences="66" value="â" /> + <ngram occurrences="63" value="_ó" /> + <ngram occurrences="58" value="õ_" /> + <ngram occurrences="58" value="ç" /> + <ngram occurrences="58" value="å_" /> + <ngram occurrences="57" value="_ä" /> + <ngram occurrences="56" value="_¨" /> + <ngram occurrences="53" value="_ú" /> + <ngram occurrences="52" value="þ" /> + <ngram occurrences="52" value="ñ_" /> + <ngram occurrences="50" value="ø" /> + <ngram occurrences="50" value="_î" /> + <ngram occurrences="49" value="_ô" /> + <ngram occurrences="44" value="îá" /> + <ngram occurrences="40" value="òï" /> + <ngram occurrences="40" value="ðï" /> + <ngram occurrences="40" value="ê" /> + <ngram occurrences="40" value="_ï" /> + <ngram occurrences="38" value="è" /> + <ngram occurrences="38" value="_ë" /> + <ngram occurrences="38" value="_â" /> + <ngram occurrences="35" value="ö" /> + <ngram occurrences="34" value="îá_" /> + <ngram occurrences="34" value="äï" /> + <ngram occurrences="33" value="ïò" /> + <ngram occurrences="33" value="ëá" /> + <ngram occurrences="32" value="û" /> + <ngram occurrences="32" value="ôé" /> + <ngram occurrences="32" value="í_" /> + <ngram occurrences="32" value="_ðï" /> + <ngram occurrences="31" value="ìé" /> + <ngram occurrences="30" value="úá" /> + <ngram occurrences="30" value="óô" /> + <ngram occurrences="30" value="à" /> + <ngram occurrences="29" value="ôá" /> + <ngram occurrences="29" value="ê_" /> + <ngram occurrences="29" value="ã" /> + <ngram occurrences="28" value="éô" /> + <ngram occurrences="28" value="_í" /> + <ngram occurrences="28" value="_á" /> + <ngram occurrences="27" value="¨ä" /> + <ngram occurrences="27" value="ý" /> + <ngram occurrences="27" value="ôï" /> + <ngram occurrences="27" value="òé" /> + <ngram occurrences="27" value="ïí" /> + <ngram occurrences="27" value="îé" /> + <ngram occurrences="27" value="ìï" /> + <ngram occurrences="27" value="ëé" /> + <ngram occurrences="27" value="áì" /> + <ngram occurrences="26" value="ôø" /> + <ngram occurrences="26" value="òá" /> + <ngram occurrences="26" value="ïä" /> + <ngram occurrences="26" value="_ñ" /> + <ngram occurrences="25" value="ø_" /> + <ngram occurrences="25" value="çï" /> + <ngram occurrences="25" value="_äï" /> + <ngram occurrences="24" value="ðò" /> + <ngram occurrences="24" value="éî" /> + <ngram occurrences="24" value="_úá" /> + <ngram occurrences="23" value="ïó" /> + <ngram occurrences="23" value="ïì" /> + <ngram occurrences="23" value="ëï" /> + <ngram occurrences="23" value="à_" /> + <ngram occurrences="23" value="_þ" /> + <ngram occurrences="23" value="_îá" /> + <ngram occurrences="23" value="_é" /> + <ngram occurrences="22" value="åò" /> + <ngram occurrences="22" value="äá" /> + <ngram occurrences="22" value="_ò" /> + <ngram occurrences="22" value="_ðò" /> + <ngram occurrences="21" value="î¨" /> + <ngram occurrences="20" value="¨ì" /> + <ngram occurrences="20" value="ú_" /> + <ngram occurrences="20" value="ïç" /> + <ngram occurrences="20" value="îå" /> + <ngram occurrences="20" value="äï_" /> + <ngram occurrences="19" value="ôø_" /> + <ngram occurrences="19" value="óñ" /> + <ngram occurrences="19" value="ëé_" /> + <ngram occurrences="19" value="áò" /> + <ngram occurrences="19" value="_ý" /> + <ngram occurrences="19" value="_ç" /> + <ngram occurrences="18" value="ýï" /> + <ngram occurrences="18" value="óñ_" /> + <ngram occurrences="18" value="î¨_" /> + <ngram occurrences="18" value="åî" /> + <ngram occurrences="17" value="¨î" /> + <ngram occurrences="17" value="õä" /> + <ngram occurrences="17" value="ôé_" /> + <ngram occurrences="17" value="ð¨" /> + <ngram occurrences="17" value="ïâ" /> + <ngram occurrences="17" value="é_ð" /> + <ngram occurrences="17" value="áô" /> + <ngram occurrences="16" value="ï_¨" /> + <ngram occurrences="16" value="îï" /> + <ngram occurrences="16" value="è_" /> + <ngram occurrences="16" value="ä¨" /> + <ngram occurrences="16" value="_ýï" /> + <ngram occurrences="16" value="_îå" /> + <ngram occurrences="16" value="_îá_" /> + <ngram occurrences="16" value="_ã" /> + <ngram occurrences="15" value="ýï_" /> + <ngram occurrences="15" value="öå" /> + <ngram occurrences="15" value="ïà_" /> + <ngram occurrences="15" value="ïà" /> + <ngram occurrences="15" value="ìé_" /> + <ngram occurrences="15" value="ìá" /> + <ngram occurrences="15" value="ë_" /> + <ngram occurrences="15" value="çá" /> + <ngram occurrences="15" value="á_ä" /> + <ngram occurrences="15" value="_¨_" /> + <ngram occurrences="15" value="_ú_" /> + <ngram occurrences="15" value="_ëá" /> + <ngram occurrences="15" value="_è" /> + <ngram occurrences="15" value="_äï_" /> + <ngram occurrences="14" value="öå_" /> + <ngram occurrences="14" value="ôå" /> + <ngram occurrences="14" value="ôá_" /> + <ngram occurrences="14" value="ò¨" /> + <ngram occurrences="14" value="ïçï" /> + <ngram occurrences="14" value="íõ" /> + <ngram occurrences="14" value="íï" /> + <ngram occurrences="14" value="ì¨" /> + <ngram occurrences="14" value="ëá_" /> + <ngram occurrences="14" value="éê_" /> + <ngram occurrences="14" value="éê" /> + <ngram occurrences="14" value="çï_" /> + <ngram occurrences="14" value="äå" /> + <ngram occurrences="14" value="ä_" /> + <ngram occurrences="14" value="â¨" /> + <ngram occurrences="14" value="_¨ä" /> + <ngram occurrences="14" value="_ýï_" /> + <ngram occurrences="14" value="_ð¨" /> + <ngram occurrences="14" value="_å" /> + <ngram occurrences="13" value="ñë" /> + <ngram occurrences="13" value="ïí_" /> + <ngram occurrences="13" value="ïìï" /> + <ngram occurrences="13" value="îõ" /> + <ngram occurrences="13" value="ìñ" /> + <ngram occurrences="13" value="éì" /> + <ngram occurrences="13" value="èï" /> + <ngram occurrences="13" value="äõ" /> + <ngram occurrences="13" value="äî" /> + <ngram occurrences="13" value="äé" /> + <ngram occurrences="13" value="ã¨" /> + <ngram occurrences="13" value="âõ" /> + <ngram occurrences="13" value="áî" /> + <ngram occurrences="13" value="i" /> + <ngram occurrences="13" value="_óô" /> + <ngram occurrences="12" value="þé" /> + <ngram occurrences="12" value="þå" /> + <ngram occurrences="12" value="øë" /> + <ngram occurrences="12" value="ó_" /> + <ngram occurrences="12" value="ðòï" /> + <ngram occurrences="12" value="ðï_" /> + <ngram occurrences="12" value="îå_" /> + <ngram occurrences="12" value="íõ_" /> + <ngram occurrences="12" value="ìå" /> + <ngram occurrences="12" value="éó" /> + <ngram occurrences="12" value="éë" /> + <ngram occurrences="12" value="äá_" /> + <ngram occurrences="12" value="á_ô" /> + <ngram occurrences="12" value="_û" /> + <ngram occurrences="12" value="_ö" /> + <ngram occurrences="12" value="_õ" /> + <ngram occurrences="12" value="_ñë" /> + <ngram occurrences="12" value="_ì" /> + <ngram occurrences="12" value="_âõ" /> + <ngram occurrences="11" value="þï" /> + <ngram occurrences="11" value="úá_" /> + <ngram occurrences="11" value="ô¨" /> + <ngram occurrences="11" value="óôï" /> + <ngram occurrences="11" value="ðé" /> + <ngram occurrences="11" value="ïòï" /> + <ngram occurrences="11" value="ïíõ_" /> + <ngram occurrences="11" value="ïíõ" /> + <ngram occurrences="11" value="ïçï_" /> + <ngram occurrences="11" value="î_" /> + <ngram occurrences="11" value="íá" /> + <ngram occurrences="11" value="âé" /> + <ngram occurrences="11" value="áö" /> + <ngram occurrences="11" value="áä" /> + <ngram occurrences="11" value="á_ó" /> + <ngram occurrences="11" value="á_ð" /> + <ngram occurrences="11" value="_ðòï" /> + <ngram occurrences="10" value="¨ô" /> + <ngram occurrences="10" value="¨_î" /> + <ngram occurrences="10" value="ôïò" /> + <ngram occurrences="10" value="ðå" /> + <ngram occurrences="10" value="ðá" /> + <ngram occurrences="10" value="ïþ" /> + <ngram occurrences="10" value="ìø" /> + <ngram occurrences="10" value="ìï_" /> + <ngram occurrences="10" value="é_ó" /> + <ngram occurrences="10" value="é_ðï" /> + <ngram occurrences="10" value="åí" /> + <ngram occurrences="10" value="ä¨_" /> + <ngram occurrences="10" value="_úá_" /> + <ngram occurrences="10" value="_ó_" /> + <ngram occurrences="10" value="_òï" /> + <ngram occurrences="10" value="_ï_" /> + <ngram occurrences="10" value="_îå_" /> + <ngram occurrences="9" value="ô_" /> + <ngram occurrences="9" value="óé" /> + <ngram occurrences="9" value="òô" /> + <ngram occurrences="9" value="ò_" /> + <ngram occurrences="9" value="ð¨ä" /> + <ngram occurrences="9" value="ïî" /> + <ngram occurrences="9" value="ïë" /> + <ngram occurrences="9" value="ï_ð" /> + <ngram occurrences="9" value="îñ" /> + <ngram occurrences="9" value="îî" /> + <ngram occurrences="9" value="ë¨" /> + <ngram occurrences="9" value="ëõ" /> + <ngram occurrences="9" value="ëáö" /> + <ngram occurrences="9" value="áôé" /> + <ngram occurrences="9" value="áí" /> + <ngram occurrences="9" value="áë" /> + <ngram occurrences="9" value="_õ_" /> + <ngram occurrences="9" value="_ôï" /> + <ngram occurrences="9" value="_ôá" /> + <ngram occurrences="9" value="_ð¨ä" /> + <ngram occurrences="9" value="_íï" /> + <ngram occurrences="9" value="_â¨" /> + <ngram occurrences="8" value="¨ó" /> + <ngram occurrences="8" value="¨ìø" /> + <ngram occurrences="8" value="¨_¨" /> + <ngram occurrences="8" value="¨_ó" /> + <ngram occurrences="8" value="¨_ð" /> + <ngram occurrences="8" value="úî" /> + <ngram occurrences="8" value="õì" /> + <ngram occurrences="8" value="òõ" /> + <ngram occurrences="8" value="òå" /> + <ngram occurrences="8" value="ðòé" /> + <ngram occurrences="8" value="ï_ï" /> + <ngram occurrences="8" value="îõ_" /> + <ngram occurrences="8" value="îñ_" /> + <ngram occurrences="8" value="íé" /> + <ngram occurrences="8" value="ìå_" /> + <ngram occurrences="8" value="éôø_" /> + <ngram occurrences="8" value="éôø" /> + <ngram occurrences="8" value="éôé" /> + <ngram occurrences="8" value="åó" /> + <ngram occurrences="8" value="åì" /> + <ngram occurrences="8" value="äõ_" /> + <ngram occurrences="8" value="ã¨_" /> + <ngram occurrences="8" value="âá" /> + <ngram occurrences="8" value="áìå" /> + <ngram occurrences="8" value="á_ú" /> + <ngram occurrences="8" value="_þï" /> + <ngram occurrences="8" value="_ôé" /> + <ngram occurrences="8" value="_ñ_" /> + <ngram occurrences="8" value="_ðé" /> + <ngram occurrences="8" value="_ëáö" /> + <ngram occurrences="8" value="_çï" /> + <ngram occurrences="7" value="¨ë" /> + <ngram occurrences="7" value="¨ê" /> + <ngram occurrences="7" value="¨äð" /> + <ngram occurrences="7" value="ôõ" /> + <ngram occurrences="7" value="óø" /> + <ngram occurrences="7" value="óõ" /> + <ngram occurrences="7" value="óï" /> + <ngram occurrences="7" value="òá_" /> + <ngram occurrences="7" value="ñ_ó" /> + <ngram occurrences="7" value="ïú" /> + <ngram occurrences="7" value="ïò¨" /> + <ngram occurrences="7" value="ïìï_" /> + <ngram occurrences="7" value="ïä¨" /> + <ngram occurrences="7" value="ï_¨ä" /> + <ngram occurrences="7" value="ï_ë" /> + <ngram occurrences="7" value="ï_é" /> + <ngram occurrences="7" value="ï_ä" /> + <ngram occurrences="7" value="îë" /> + <ngram occurrences="7" value="îé_" /> + <ngram occurrences="7" value="íé_" /> + <ngram occurrences="7" value="ìïó" /> + <ngram occurrences="7" value="ìá_" /> + <ngram occurrences="7" value="ëáöå_" /> + <ngram occurrences="7" value="ëáöå" /> + <ngram occurrences="7" value="éí" /> + <ngram occurrences="7" value="éè_" /> + <ngram occurrences="7" value="éè" /> + <ngram occurrences="7" value="é_í" /> + <ngram occurrences="7" value="é_ä" /> + <ngram occurrences="7" value="å_ó" /> + <ngram occurrences="7" value="å_ð" /> + <ngram occurrences="7" value="äð" /> + <ngram occurrences="7" value="áú" /> + <ngram occurrences="7" value="áöå_" /> + <ngram occurrences="7" value="áöå" /> + <ngram occurrences="7" value="áó" /> + <ngram occurrences="7" value="áìé" /> + <ngram occurrences="7" value="á_û" /> + <ngram occurrences="7" value="á_â" /> + <ngram occurrences="7" value="_þé" /> + <ngram occurrences="7" value="_óôï" /> + <ngram occurrences="7" value="_óï" /> + <ngram occurrences="7" value="_ðòé" /> + <ngram occurrences="7" value="_ðï_" /> + <ngram occurrences="7" value="_ëï" /> + <ngram occurrences="7" value="_ëáöå" /> + <ngram occurrences="7" value="_ê" /> + <ngram occurrences="7" value="_é_" /> + <ngram occurrences="7" value="_áì" /> + <ngram occurrences="7" value="_á_" /> + <ngram occurrences="6" value="¨ò" /> + <ngram occurrences="6" value="¨ñ" /> + <ngram occurrences="6" value="¨îë" /> + <ngram occurrences="6" value="¨ìøë" /> + <ngram occurrences="6" value="¨äá_" /> + <ngram occurrences="6" value="¨äá" /> + <ngram occurrences="6" value="¨_ú" /> + <ngram occurrences="6" value="¨_ðò" /> + <ngram occurrences="6" value="¨_ë" /> + <ngram occurrences="6" value="¨_ä" /> + <ngram occurrences="6" value="þïìï_" /> + <ngram occurrences="6" value="þïìï" /> + <ngram occurrences="6" value="þïì" /> + <ngram occurrences="6" value="þåî" /> + <ngram occurrences="6" value="þá" /> + <ngram occurrences="6" value="ýå" /> + <ngram occurrences="6" value="ûé" /> + <ngram occurrences="6" value="úîá" /> + <ngram occurrences="6" value="øó" /> + <ngram occurrences="6" value="øëé_" /> + <ngram occurrences="6" value="øëé" /> + <ngram occurrences="6" value="õò" /> + <ngram occurrences="6" value="õ_ó" /> + <ngram occurrences="6" value="õ_ð" /> + <ngram occurrences="6" value="ô¨_" /> + <ngram occurrences="6" value="ôò" /> + <ngram occurrences="6" value="ó¨" /> + <ngram occurrences="6" value="óôïò" /> + <ngram occurrences="6" value="óôá" /> + <ngram occurrences="6" value="óì" /> + <ngram occurrences="6" value="óå" /> + <ngram occurrences="6" value="ò¨_" /> + <ngram occurrences="6" value="òïú" /> + <ngram occurrences="6" value="òî" /> + <ngram occurrences="6" value="òé_" /> + <ngram occurrences="6" value="ñ_ú" /> + <ngram occurrences="6" value="ñ_ð" /> + <ngram occurrences="6" value="ñ_ä" /> + <ngram occurrences="6" value="ðï_¨" /> + <ngram occurrences="6" value="ðåò" /> + <ngram occurrences="6" value="ïóô" /> + <ngram occurrences="6" value="ïòá" /> + <ngram occurrences="6" value="ïìï_¨" /> + <ngram occurrences="6" value="ïäé" /> + <ngram occurrences="6" value="ï_¨ë" /> + <ngram occurrences="6" value="ï_ó" /> + <ngram occurrences="6" value="îï_" /> + <ngram occurrences="6" value="îîñ" /> + <ngram occurrences="6" value="íï_" /> + <ngram occurrences="6" value="ìøë" /> + <ngram occurrences="6" value="ìñ_" /> + <ngram occurrences="6" value="ìï_¨ë" /> + <ngram occurrences="6" value="ìï_¨" /> + <ngram occurrences="6" value="ëõ_" /> + <ngram occurrences="6" value="ëò" /> + <ngram occurrences="6" value="éî_" /> + <ngram occurrences="6" value="èïä" /> + <ngram occurrences="6" value="æ" /> + <ngram occurrences="6" value="åê" /> + <ngram occurrences="6" value="å_î" /> + <ngram occurrences="6" value="âõä" /> + <ngram occurrences="6" value="âï" /> + <ngram occurrences="6" value="áôé_" /> + <ngram occurrences="6" value="áð" /> + <ngram occurrences="6" value="áí_" /> + <ngram occurrences="6" value="à_ð" /> + <ngram occurrences="6" value="i_" /> + <ngram occurrences="6" value="_¨ë" /> + <ngram occurrences="6" value="_þïìï" /> + <ngram occurrences="6" value="_þïì" /> + <ngram occurrences="6" value="_ô¨" /> + <ngram occurrences="6" value="_ôå" /> +</ngrams> diff --git a/src/plugins/language/vietnamese.klp b/src/plugins/language/vietnamese.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="1220" value="_" /> + <ngram occurrences="445" value="n" /> + <ngram occurrences="350" value="h" /> + <ngram occurrences="237" value="t" /> + <ngram occurrences="213" value="c" /> + <ngram occurrences="207" value="i" /> + <ngram occurrences="201" value="_t" /> + <ngram occurrences="191" value="g" /> + <ngram occurrences="190" value="_n" /> + <ngram occurrences="167" value="_c" /> + <ngram occurrences="163" value="i_" /> + <ngram occurrences="157" value="ng" /> + <ngram occurrences="132" value="a" /> + <ngram occurrences="127" value="g_" /> + <ngram occurrences="126" value="n_" /> + <ngram occurrences="121" value="ng_" /> + <ngram occurrences="115" value="u" /> + <ngram occurrences="114" value="nh" /> + <ngram occurrences="108" value="à" /> + <ngram occurrences="103" value="h_" /> + <ngram occurrences="82" value="m" /> + <ngram occurrences="73" value="c_" /> + <ngram occurrences="72" value="l" /> + <ngram occurrences="70" value="o" /> + <ngram occurrences="68" value="_ng" /> + <ngram occurrences="67" value="th" /> + <ngram occurrences="67" value="nh_" /> + <ngram occurrences="67" value="_th" /> + <ngram occurrences="66" value="r" /> + <ngram occurrences="64" value="ü" /> + <ngram occurrences="63" value="ç" /> + <ngram occurrences="63" value="_ç" /> + <ngram occurrences="62" value="t_" /> + <ngram occurrences="60" value="s" /> + <ngram occurrences="58" value="u_" /> + <ngram occurrences="58" value="_l" /> + <ngram occurrences="57" value="_nh" /> + <ngram occurrences="55" value="m_" /> + <ngram occurrences="55" value="a_" /> + <ngram occurrences="55" value="_s" /> + <ngram occurrences="55" value="_h" /> + <ngram occurrences="54" value="ó" /> + <ngram occurrences="53" value="_m" /> + <ngram occurrences="52" value="ü_" /> + <ngram occurrences="51" value="y" /> + <ngram occurrences="49" value="á" /> + <ngram occurrences="47" value="y_" /> + <ngram occurrences="47" value="v" /> + <ngram occurrences="47" value="_v" /> + <ngram occurrences="46" value="ch" /> + <ngram occurrences="44" value="o_" /> + <ngram occurrences="42" value="k" /> + <ngram occurrences="41" value="_i" /> + <ngram occurrences="40" value="à_" /> + <ngram occurrences="40" value="_k" /> + <ngram occurrences="40" value="_i_" /> + <ngram occurrences="39" value="_c_" /> + <ngram occurrences="38" value="hi" /> + <ngram occurrences="37" value="p" /> + <ngram occurrences="37" value="kh" /> + <ngram occurrences="37" value="_kh" /> + <ngram occurrences="37" value="_ch" /> + <ngram occurrences="35" value="å" /> + <ngram occurrences="35" value="b" /> + <ngram occurrences="35" value="_b" /> + <ngram occurrences="34" value="_g" /> + <ngram occurrences="33" value="tr" /> + <ngram occurrences="33" value="d" /> + <ngram occurrences="33" value="_t_" /> + <ngram occurrences="33" value="_p" /> + <ngram occurrences="33" value="_ng_" /> + <ngram occurrences="32" value="hi_" /> + <ngram occurrences="31" value="ô" /> + <ngram occurrences="31" value="ó_" /> + <ngram occurrences="31" value="ã" /> + <ngram occurrences="31" value="ng_t" /> + <ngram occurrences="31" value="g_t" /> + <ngram occurrences="31" value="e" /> + <ngram occurrences="31" value="_tr" /> + <ngram occurrences="31" value="_d" /> + <ngram occurrences="30" value="û" /> + <ngram occurrences="30" value="ì" /> + <ngram occurrences="28" value="_n_" /> + <ngram occurrences="27" value="là" /> + <ngram occurrences="27" value="_là" /> + <ngram occurrences="26" value="ph" /> + <ngram occurrences="26" value="i_t" /> + <ngram occurrences="26" value="cû" /> + <ngram occurrences="26" value="an" /> + <ngram occurrences="26" value="_ph" /> + <ngram occurrences="26" value="_m_" /> + <ngram occurrences="26" value="_cû" /> + <ngram occurrences="25" value="àn" /> + <ngram occurrences="25" value="n_t" /> + <ngram occurrences="23" value="ê" /> + <ngram occurrences="23" value="æ" /> + <ngram occurrences="22" value="ôn" /> + <ngram occurrences="22" value="i_n" /> + <ngram occurrences="22" value="_u" /> + <ngram occurrences="21" value="ç_" /> + <ngram occurrences="21" value="ä" /> + <ngram occurrences="21" value="ha" /> + <ngram occurrences="21" value="có_" /> + <ngram occurrences="21" value="có" /> + <ngram occurrences="21" value="_ç_" /> + <ngram occurrences="21" value="_u_" /> + <ngram occurrences="21" value="_có_" /> + <ngram occurrences="21" value="_có" /> + <ngram occurrences="20" value="ûa_" /> + <ngram occurrences="20" value="ûa" /> + <ngram occurrences="20" value="là_" /> + <ngram occurrences="20" value="i_c" /> + <ngram occurrences="20" value="hü" /> + <ngram occurrences="20" value="hà" /> + <ngram occurrences="20" value="ho" /> + <ngram occurrences="20" value="cûa_" /> + <ngram occurrences="20" value="cûa" /> + <ngram occurrences="20" value="_là_" /> + <ngram occurrences="20" value="_cûa_" /> + <ngram occurrences="20" value="_cûa" /> + <ngram occurrences="19" value="â" /> + <ngram occurrences="19" value="qu" /> + <ngram occurrences="19" value="q" /> + <ngram occurrences="19" value="n_c" /> + <ngram occurrences="19" value="h_n" /> + <ngram occurrences="19" value="gi" /> + <ngram occurrences="19" value="_qu" /> + <ngram occurrences="19" value="_q" /> + <ngram occurrences="19" value="_gi" /> + <ngram occurrences="18" value="ác" /> + <ngram occurrences="18" value="i_u_" /> + <ngram occurrences="18" value="i_u" /> + <ngram occurrences="18" value="_r" /> + <ngram occurrences="17" value="ông_" /> + <ngram occurrences="17" value="ông" /> + <ngram occurrences="17" value="ì_" /> + <ngram occurrences="17" value="ên_" /> + <ngram occurrences="17" value="ên" /> + <ngram occurrences="17" value="uy" /> + <ngram occurrences="17" value="in" /> + <ngram occurrences="17" value="hi_u_" /> + <ngram occurrences="17" value="hi_u" /> + <ngram occurrences="17" value="h_t" /> + <ngram occurrences="17" value="ch_" /> + <ngram occurrences="16" value="nhi" /> + <ngram occurrences="16" value="hô" /> + <ngram occurrences="16" value="há" /> + <ngram occurrences="16" value="_nhi" /> + <ngram occurrences="15" value="ü_i_" /> + <ngram occurrences="15" value="ü_i" /> + <ngram occurrences="15" value="ö" /> + <ngram occurrences="15" value="ò" /> + <ngram occurrences="15" value="ân_" /> + <ngram occurrences="15" value="ân" /> + <ngram occurrences="15" value="và" /> + <ngram occurrences="15" value="ngü" /> + <ngram occurrences="15" value="gü" /> + <ngram occurrences="15" value="_và" /> + <ngram occurrences="15" value="_ngü" /> + <ngram occurrences="14" value="ü_c" /> + <ngram occurrences="14" value="ø" /> + <ngram occurrences="14" value="ãt_" /> + <ngram occurrences="14" value="ãt" /> + <ngram occurrences="14" value="uy_" /> + <ngram occurrences="14" value="sa" /> + <ngram occurrences="14" value="ra" /> + <ngram occurrences="14" value="ng_c" /> + <ngram occurrences="14" value="n_th" /> + <ngram occurrences="14" value="n_n" /> + <ngram occurrences="14" value="m_t" /> + <ngram occurrences="14" value="hì" /> + <ngram occurrences="14" value="h_c" /> + <ngram occurrences="14" value="g_c" /> + <ngram occurrences="14" value="_sa" /> + <ngram occurrences="14" value="_m_t" /> + <ngram occurrences="13" value="ü_n" /> + <ngram occurrences="13" value="ü_c_" /> + <ngram occurrences="13" value="ú" /> + <ngram occurrences="13" value="ù" /> + <ngram occurrences="13" value="ình_" /> + <ngram occurrences="13" value="ình" /> + <ngram occurrences="13" value="ìn" /> + <ngram occurrences="13" value="ån" /> + <ngram occurrences="13" value="åi_" /> + <ngram occurrences="13" value="åi" /> + <ngram occurrences="13" value="ngü_i" /> + <ngram occurrences="13" value="ngü_" /> + <ngram occurrences="13" value="ng_n" /> + <ngram occurrences="13" value="hü_" /> + <ngram occurrences="13" value="hôn" /> + <ngram occurrences="13" value="hì_" /> + <ngram occurrences="13" value="gü_i_" /> + <ngram occurrences="13" value="gü_i" /> + <ngram occurrences="13" value="gü_" /> + <ngram occurrences="13" value="g_n" /> + <ngram occurrences="13" value="a_t" /> + <ngram occurrences="13" value="_ngü_" /> + <ngram occurrences="12" value="ü_ng" /> + <ngram occurrences="12" value="on" /> + <ngram occurrences="12" value="nhi_u" /> + <ngram occurrences="12" value="nhi_" /> + <ngram occurrences="12" value="ng_th" /> + <ngram occurrences="12" value="m_t_" /> + <ngram occurrences="12" value="l_" /> + <ngram occurrences="12" value="không" /> + <ngram occurrences="12" value="khôn" /> + <ngram occurrences="12" value="khô" /> + <ngram occurrences="12" value="inh_" /> + <ngram occurrences="12" value="inh" /> + <ngram occurrences="12" value="hông_" /> + <ngram occurrences="12" value="hông" /> + <ngram occurrences="12" value="ho_" /> + <ngram occurrences="12" value="g_th" /> + <ngram occurrences="12" value="ay_" /> + <ngram occurrences="12" value="ay" /> + <ngram occurrences="12" value="_nhi_" /> + <ngram occurrences="12" value="_m_t_" /> + <ngram occurrences="12" value="_khôn" /> + <ngram occurrences="12" value="_khô" /> + <ngram occurrences="11" value="ü_ng_" /> + <ngram occurrences="11" value="ác_" /> + <ngram occurrences="11" value="àu_" /> + <ngram occurrences="11" value="àu" /> + <ngram occurrences="11" value="ào_" /> + <ngram occurrences="11" value="ào" /> + <ngram occurrences="11" value="x" /> + <ngram occurrences="11" value="u_c" /> + <ngram occurrences="11" value="t_n" /> + <ngram occurrences="11" value="s_" /> + <ngram occurrences="11" value="p_" /> + <ngram occurrences="11" value="nh_t" /> + <ngram occurrences="11" value="n_m" /> + <ngram occurrences="11" value="cá" /> + <ngram occurrences="11" value="c_n" /> + <ngram occurrences="11" value="c_c" /> + <ngram occurrences="11" value="_x" /> + <ngram occurrences="11" value="_cá" /> + <ngram occurrences="10" value="ön" /> + <ngram occurrences="10" value="çü_c_" /> + <ngram occurrences="10" value="çü_c" /> + <ngram occurrences="10" value="çü_" /> + <ngram occurrences="10" value="çü" /> + <ngram occurrences="10" value="ç_n" /> + <ngram occurrences="10" value="æn" /> + <ngram occurrences="10" value="án" /> + <ngram occurrences="10" value="á_" /> + <ngram occurrences="10" value="àng_" /> + <ngram occurrences="10" value="àng" /> + <ngram occurrences="10" value="à_c" /> + <ngram occurrences="10" value="ti" /> + <ngram occurrences="10" value="nhü" /> + <ngram occurrences="10" value="nh_n" /> + <ngram occurrences="10" value="nh_c" /> + <ngram occurrences="10" value="n_ç" /> + <ngram occurrences="10" value="h_ng" /> + <ngram occurrences="10" value="f" /> + <ngram occurrences="10" value="cho_" /> + <ngram occurrences="10" value="cho" /> + <ngram occurrences="10" value="an_" /> + <ngram occurrences="10" value="a_c" /> + <ngram occurrences="10" value="_çü_c" /> + <ngram occurrences="10" value="_çü_" /> + <ngram occurrences="10" value="_çü" /> + <ngram occurrences="10" value="_ç_n" /> + <ngram occurrences="10" value="_nhü" /> + <ngram occurrences="10" value="_nh_" /> + <ngram occurrences="10" value="_h_" /> + <ngram occurrences="10" value="_cho_" /> + <ngram occurrences="10" value="_cho" /> + <ngram occurrences="9" value="õ" /> + <ngram occurrences="9" value="ón" /> + <ngram occurrences="9" value="òn" /> + <ngram occurrences="9" value="î" /> + <ngram occurrences="9" value="ë" /> + <ngram occurrences="9" value="çã" /> + <ngram occurrences="9" value="ån_" /> + <ngram occurrences="9" value="ã_" /> + <ngram occurrences="9" value="ày_" /> + <ngram occurrences="9" value="ày" /> + <ngram occurrences="9" value="y_n" /> + <ngram occurrences="9" value="và_" /> + <ngram occurrences="9" value="u_t" /> + <ngram occurrences="9" value="u_n" /> + <ngram occurrences="9" value="thì_" /> + <ngram occurrences="9" value="thì" /> + <ngram occurrences="9" value="ta" /> + <ngram occurrences="9" value="ra_" /> + <ngram occurrences="9" value="o_n" /> + <ngram occurrences="9" value="nà" /> + <ngram occurrences="9" value="m_n" /> + <ngram occurrences="9" value="i_v" /> + <ngram occurrences="9" value="hàn" /> + <ngram occurrences="9" value="hu" /> + <ngram occurrences="9" value="các" /> + <ngram occurrences="9" value="c_t" /> + <ngram occurrences="9" value="anh_" /> + <ngram occurrences="9" value="anh" /> + <ngram occurrences="9" value="_çã" /> + <ngram occurrences="9" value="_và_" /> + <ngram occurrences="9" value="_ti" /> + <ngram occurrences="9" value="_thì_" /> + <ngram occurrences="9" value="_thì" /> + <ngram occurrences="9" value="_nà" /> + <ngram occurrences="9" value="_l_" /> + <ngram occurrences="9" value="_các" /> + <ngram occurrences="8" value="úc_" /> + <ngram occurrences="8" value="úc" /> + <ngram occurrences="8" value="í" /> + <ngram occurrences="8" value="ë_" /> + <ngram occurrences="8" value="çã_" /> + <ngram occurrences="8" value="æn_" /> + <ngram occurrences="8" value="ành_" /> + <ngram occurrences="8" value="ành" /> + <ngram occurrences="8" value="un" /> + <ngram occurrences="8" value="tu" /> + <ngram occurrences="8" value="trong" /> + <ngram occurrences="8" value="tron" /> + <ngram occurrences="8" value="tro" /> + <ngram occurrences="8" value="t_c" /> + <ngram occurrences="8" value="só" /> + <ngram occurrences="8" value="rong_" /> + <ngram occurrences="8" value="rong" /> + <ngram occurrences="8" value="ron" /> + <ngram occurrences="8" value="ro" /> + <ngram occurrences="8" value="ong_" /> + <ngram occurrences="8" value="ong" /> + <ngram occurrences="8" value="o_t" /> + <ngram occurrences="8" value="nhü_" /> + <ngram occurrences="8" value="n_l" /> + <ngram occurrences="8" value="khá" /> + <ngram occurrences="8" value="i_l" /> + <ngram occurrences="8" value="hú" /> + <ngram occurrences="8" value="hay_" /> + <ngram occurrences="8" value="hay" /> + <ngram occurrences="8" value="h_th" /> + <ngram occurrences="8" value="h_s" /> + <ngram occurrences="8" value="gi_" /> + <ngram occurrences="8" value="b_" /> + <ngram occurrences="8" value="au_" /> + <ngram occurrences="8" value="au" /> + <ngram occurrences="8" value="ai_" /> + <ngram occurrences="8" value="ai" /> + <ngram occurrences="8" value="_çã_" /> + <ngram occurrences="8" value="_tron" /> + <ngram occurrences="8" value="_tro" /> + <ngram occurrences="8" value="_só" /> + <ngram occurrences="8" value="_s_" /> + <ngram occurrences="8" value="_nhü_" /> + <ngram occurrences="8" value="_ng_t" /> + <ngram occurrences="8" value="_n_c" /> + <ngram occurrences="8" value="_khá" /> + <ngram occurrences="8" value="_gi_" /> + <ngram occurrences="8" value="_ch_" /> + <ngram occurrences="8" value="_b_" /> + <ngram occurrences="8" value="_a" /> + <ngram occurrences="7" value="ø_" /> + <ngram occurrences="7" value="ó_n" /> + <ngram occurrences="7" value="ñ" /> + <ngram occurrences="7" value="ách_" /> + <ngram occurrences="7" value="ách" /> + <ngram occurrences="7" value="àn_" /> + <ngram occurrences="7" value="àm_" /> + <ngram occurrences="7" value="àm" /> + <ngram occurrences="7" value="à_t" /> + <ngram occurrences="7" value="º" /> + <ngram occurrences="7" value="y_t" /> + <ngram occurrences="7" value="y_n_" /> + <ngram occurrences="7" value="y_c" /> + <ngram occurrences="7" value="vi" /> + <ngram occurrences="7" value="v_" /> + <ngram occurrences="7" value="uy_n" /> + <ngram occurrences="7" value="ua" /> + <ngram occurrences="7" value="tô" /> + <ngram occurrences="7" value="tå" /> + <ngram occurrences="7" value="tha" /> + <ngram occurrences="7" value="re" /> + <ngram occurrences="7" value="nh_h" /> + <ngram occurrences="7" value="ng_ç" /> + <ngram occurrences="7" value="ng_b" /> + <ngram occurrences="7" value="lå" /> + <ngram occurrences="7" value="iê" /> + <ngram occurrences="7" value="i_ç" /> + <ngram occurrences="7" value="i_t_" /> + <ngram occurrences="7" value="i_n_" /> + <ngram occurrences="7" value="i_d" /> + <ngram occurrences="7" value="hõ" /> + <ngram occurrences="7" value="hó" /> + <ngram occurrences="7" value="hã" /> + <ngram occurrences="7" value="h_ng_" /> + <ngram occurrences="7" value="h_h" /> + <ngram occurrences="7" value="g_ç" /> + <ngram occurrences="7" value="g_b" /> + <ngram occurrences="7" value="c_ç" /> + <ngram occurrences="7" value="ar" /> + <ngram occurrences="7" value="ao_" /> + <ngram occurrences="7" value="ao" /> + <ngram occurrences="7" value="al" /> + <ngram occurrences="7" value="_ñ" /> + <ngram occurrences="7" value="_vi" /> + <ngram occurrences="7" value="_v_" /> +</ngrams> diff --git a/src/plugins/language/welsh.klp b/src/plugins/language/welsh.klp @@ -0,0 +1,404 @@ +<?xml version="1.0" encoding="UTF-8" ?> +<!DOCTYPE klp SYSTEM "klp.dtd"> +<ngrams> + <ngram occurrences="802" value="_" /> + <ngram occurrences="356" value="y" /> + <ngram occurrences="353" value="d" /> + <ngram occurrences="342" value="a" /> + <ngram occurrences="292" value="n" /> + <ngram occurrences="291" value="e" /> + <ngram occurrences="269" value="r" /> + <ngram occurrences="255" value="i" /> + <ngram occurrences="181" value="o" /> + <ngram occurrences="164" value="l" /> + <ngram occurrences="154" value="h" /> + <ngram occurrences="147" value="g" /> + <ngram occurrences="136" value="_y" /> + <ngram occurrences="127" value="f" /> + <ngram occurrences="126" value="t" /> + <ngram occurrences="125" value="w" /> + <ngram occurrences="120" value="n_" /> + <ngram occurrences="107" value="dd" /> + <ngram occurrences="99" value="u" /> + <ngram occurrences="97" value="m" /> + <ngram occurrences="96" value="s" /> + <ngram occurrences="92" value="c" /> + <ngram occurrences="90" value="d_" /> + <ngram occurrences="89" value="yn" /> + <ngram occurrences="89" value="r_" /> + <ngram occurrences="81" value="_a" /> + <ngram occurrences="68" value="u_" /> + <ngram occurrences="67" value="yn_" /> + <ngram occurrences="65" value="yd" /> + <ngram occurrences="64" value="th" /> + <ngram occurrences="64" value="l_" /> + <ngram occurrences="61" value="i_" /> + <ngram occurrences="61" value="_g" /> + <ngram occurrences="60" value="_yn" /> + <ngram occurrences="57" value="_d" /> + <ngram occurrences="56" value="_yn_" /> + <ngram occurrences="55" value="_i" /> + <ngram occurrences="53" value="ym" /> + <ngram occurrences="49" value="ydd" /> + <ngram occurrences="49" value="_c" /> + <ngram occurrences="48" value="y_" /> + <ngram occurrences="48" value="h_" /> + <ngram occurrences="48" value="b" /> + <ngram occurrences="48" value="ae" /> + <ngram occurrences="45" value="wy" /> + <ngram occurrences="44" value="g_" /> + <ngram occurrences="43" value="ra" /> + <ngram occurrences="43" value="o_" /> + <ngram occurrences="43" value="ia" /> + <ngram occurrences="43" value="an" /> + <ngram occurrences="42" value="ol" /> + <ngram occurrences="42" value="ar" /> + <ngram occurrences="42" value="_r" /> + <ngram occurrences="41" value="th_" /> + <ngram occurrences="40" value="ei" /> + <ngram occurrences="39" value="dd_" /> + <ngram occurrences="39" value="_y_" /> + <ngram occurrences="38" value="_n" /> + <ngram occurrences="37" value="di" /> + <ngram occurrences="36" value="ol_" /> + <ngram occurrences="36" value="_e" /> + <ngram occurrences="35" value="ed" /> + <ngram occurrences="33" value="gy" /> + <ngram occurrences="33" value="cy" /> + <ngram occurrences="33" value="ai" /> + <ngram occurrences="33" value="_s" /> + <ngram occurrences="32" value="da" /> + <ngram occurrences="32" value="_r_" /> + <ngram occurrences="32" value="_cy" /> + <ngram occurrences="31" value="p" /> + <ngram occurrences="31" value="ne" /> + <ngram occurrences="31" value="er" /> + <ngram occurrences="31" value="a_" /> + <ngram occurrences="30" value="ith" /> + <ngram occurrences="30" value="it" /> + <ngram occurrences="30" value="au_" /> + <ngram occurrences="30" value="au" /> + <ngram occurrences="30" value="_m" /> + <ngram occurrences="30" value="_i_" /> + <ngram occurrences="30" value="_h" /> + <ngram occurrences="28" value="od" /> + <ngram occurrences="28" value="n_y" /> + <ngram occurrences="28" value="en" /> + <ngram occurrences="28" value="de" /> + <ngram occurrences="28" value="_p" /> + <ngram occurrences="28" value="_gy" /> + <ngram occurrences="28" value="_f" /> + <ngram occurrences="27" value="ha" /> + <ngram occurrences="26" value="yr" /> + <ngram occurrences="26" value="wyd" /> + <ngram occurrences="26" value="ddi" /> + <ngram occurrences="25" value="mr" /> + <ngram occurrences="25" value="eg" /> + <ngram occurrences="24" value="ymr" /> + <ngram occurrences="24" value="ll" /> + <ngram occurrences="24" value="fe" /> + <ngram occurrences="24" value="_o" /> + <ngram occurrences="24" value="_ar" /> + <ngram occurrences="23" value="ri" /> + <ngram occurrences="23" value="io" /> + <ngram occurrences="23" value="if" /> + <ngram occurrences="23" value="hy" /> + <ngram occurrences="23" value="ad" /> + <ngram occurrences="23" value="_dd" /> + <ngram occurrences="22" value="yn_y" /> + <ngram occurrences="22" value="wn" /> + <ngram occurrences="22" value="s_" /> + <ngram occurrences="22" value="eg_" /> + <ngram occurrences="22" value="d_y" /> + <ngram occurrences="22" value="_a_" /> + <ngram occurrences="21" value="rae" /> + <ngram occurrences="21" value="ny" /> + <ngram occurrences="21" value="no" /> + <ngram occurrences="21" value="ew" /> + <ngram occurrences="21" value="_b" /> + <ngram occurrences="20" value="ydd_" /> + <ngram occurrences="20" value="wydd" /> + <ngram occurrences="20" value="gym" /> + <ngram occurrences="20" value="_yn_y" /> + <ngram occurrences="20" value="_gym" /> + <ngram occurrences="19" value="yf" /> + <ngram occurrences="19" value="eth" /> + <ngram occurrences="19" value="et" /> + <ngram occurrences="19" value="do" /> + <ngram occurrences="19" value="ch" /> + <ngram occurrences="18" value="rh" /> + <ngram occurrences="18" value="nydd" /> + <ngram occurrences="18" value="nyd" /> + <ngram occurrences="18" value="la" /> + <ngram occurrences="18" value="ho" /> + <ngram occurrences="18" value="eu" /> + <ngram occurrences="18" value="el" /> + <ngram occurrences="18" value="ef" /> + <ngram occurrences="18" value="at" /> + <ngram occurrences="17" value="yr_" /> + <ngram occurrences="17" value="ymrae" /> + <ngram occurrences="17" value="ymra" /> + <ngram occurrences="17" value="raeg_" /> + <ngram occurrences="17" value="raeg" /> + <ngram occurrences="17" value="mraeg" /> + <ngram occurrences="17" value="mrae" /> + <ngram occurrences="17" value="mra" /> + <ngram occurrences="17" value="me" /> + <ngram occurrences="17" value="ith_" /> + <ngram occurrences="17" value="er_" /> + <ngram occurrences="17" value="aeth" /> + <ngram occurrences="17" value="aet" /> + <ngram occurrences="17" value="aeg_" /> + <ngram occurrences="17" value="aeg" /> + <ngram occurrences="16" value="wn_" /> + <ngram occurrences="16" value="r_g" /> + <ngram occurrences="16" value="nt" /> + <ngram occurrences="16" value="ni" /> + <ngram occurrences="16" value="n_y_" /> + <ngram occurrences="16" value="le" /> + <ngram occurrences="16" value="fa" /> + <ngram occurrences="16" value="eth_" /> + <ngram occurrences="16" value="aith_" /> + <ngram occurrences="16" value="aith" /> + <ngram occurrences="16" value="ait" /> + <ngram occurrences="16" value="_w" /> + <ngram occurrences="16" value="_o_" /> + <ngram occurrences="15" value="ys" /> + <ngram occurrences="15" value="yddi" /> + <ngram occurrences="15" value="we" /> + <ngram occurrences="15" value="t_" /> + <ngram occurrences="15" value="si" /> + <ngram occurrences="15" value="ng" /> + <ngram occurrences="15" value="iai" /> + <ngram occurrences="15" value="gymr" /> + <ngram occurrences="15" value="gw" /> + <ngram occurrences="15" value="ga" /> + <ngram occurrences="15" value="g_y" /> + <ngram occurrences="15" value="fn" /> + <ngram occurrences="15" value="ff" /> + <ngram occurrences="15" value="efn" /> + <ngram occurrences="15" value="edd" /> + <ngram occurrences="15" value="c_" /> + <ngram occurrences="15" value="aeth_" /> + <ngram occurrences="15" value="ac" /> + <ngram occurrences="15" value="_yr_" /> + <ngram occurrences="15" value="_yr" /> + <ngram occurrences="15" value="_ia" /> + <ngram occurrences="15" value="_gymr" /> + <ngram occurrences="14" value="yn_y_" /> + <ngram occurrences="14" value="ro" /> + <ngram occurrences="14" value="nn" /> + <ngram occurrences="14" value="l_y" /> + <ngram occurrences="14" value="io_" /> + <ngram occurrences="14" value="iaith" /> + <ngram occurrences="14" value="iait" /> + <ngram occurrences="14" value="gymra" /> + <ngram occurrences="14" value="d_yn" /> + <ngram occurrences="14" value="_ne" /> + <ngram occurrences="14" value="_me" /> + <ngram occurrences="14" value="_l" /> + <ngram occurrences="14" value="_hy" /> + <ngram occurrences="14" value="_ei" /> + <ngram occurrences="13" value="wr" /> + <ngram occurrences="13" value="rha" /> + <ngram occurrences="13" value="oed" /> + <ngram occurrences="13" value="oe" /> + <ngram occurrences="13" value="ma" /> + <ngram occurrences="13" value="fnydd" /> + <ngram occurrences="13" value="fnyd" /> + <ngram occurrences="13" value="fny" /> + <ngram occurrences="13" value="eith" /> + <ngram occurrences="13" value="eit" /> + <ngram occurrences="13" value="efnyd" /> + <ngram occurrences="13" value="efny" /> + <ngram occurrences="13" value="defny" /> + <ngram occurrences="13" value="defn" /> + <ngram occurrences="13" value="def" /> + <ngram occurrences="13" value="dde" /> + <ngram occurrences="13" value="al" /> + <ngram occurrences="13" value="_gw" /> + <ngram occurrences="13" value="_da" /> + <ngram occurrences="12" value="sy" /> + <ngram occurrences="12" value="rt" /> + <ngram occurrences="12" value="rif" /> + <ngram occurrences="12" value="rd" /> + <ngram occurrences="12" value="r_y" /> + <ngram occurrences="12" value="oedd" /> + <ngram occurrences="12" value="o_r" /> + <ngram occurrences="12" value="nyddi" /> + <ngram occurrences="12" value="n_d" /> + <ngram occurrences="12" value="n_a" /> + <ngram occurrences="12" value="id" /> + <ngram occurrences="12" value="eu_" /> + <ngram occurrences="12" value="es" /> + <ngram occurrences="12" value="dol_" /> + <ngram occurrences="12" value="dol" /> + <ngram occurrences="12" value="d_yn_" /> + <ngram occurrences="12" value="ar_" /> + <ngram occurrences="12" value="ad_" /> + <ngram occurrences="12" value="_ym" /> + <ngram occurrences="12" value="_iait" /> + <ngram occurrences="12" value="_iai" /> + <ngram occurrences="11" value="y_g" /> + <ngram occurrences="11" value="wydd_" /> + <ngram occurrences="11" value="rth" /> + <ngram occurrences="11" value="re" /> + <ngram occurrences="11" value="o_r_" /> + <ngram occurrences="11" value="li" /> + <ngram occurrences="11" value="ig" /> + <ngram occurrences="11" value="f_" /> + <ngram occurrences="11" value="ewn" /> + <ngram occurrences="11" value="ei_" /> + <ngram occurrences="11" value="dd_y" /> + <ngram occurrences="11" value="cym" /> + <ngram occurrences="11" value="aw" /> + <ngram occurrences="11" value="an_" /> + <ngram occurrences="11" value="_y_g" /> + <ngram occurrences="11" value="_t" /> + <ngram occurrences="11" value="_fe" /> + <ngram occurrences="11" value="_ei_" /> + <ngram occurrences="11" value="_cym" /> + <ngram occurrences="11" value="_ar_" /> + <ngram occurrences="10" value="yw" /> + <ngram occurrences="10" value="un" /> + <ngram occurrences="10" value="u_a" /> + <ngram occurrences="10" value="te" /> + <ngram occurrences="10" value="ry" /> + <ngram occurrences="10" value="r_gy" /> + <ngram occurrences="10" value="r_a" /> + <ngram occurrences="10" value="pa" /> + <ngram occurrences="10" value="on" /> + <ngram occurrences="10" value="l_i" /> + <ngram occurrences="10" value="i_d" /> + <ngram occurrences="10" value="hw" /> + <ngram occurrences="10" value="gr" /> + <ngram occurrences="10" value="fr" /> + <ngram occurrences="10" value="fo" /> + <ngram occurrences="10" value="dio" /> + <ngram occurrences="10" value="ddo" /> + <ngram occurrences="10" value="ddio" /> + <ngram occurrences="10" value="dda" /> + <ngram occurrences="10" value="cr" /> + <ngram occurrences="10" value="bl" /> + <ngram occurrences="10" value="af" /> + <ngram occurrences="10" value="ac_" /> + <ngram occurrences="10" value="_r_g" /> + <ngram occurrences="10" value="_dde" /> + <ngram occurrences="10" value="_ac" /> + <ngram occurrences="9" value="yddio" /> + <ngram occurrences="9" value="yd_" /> + <ngram occurrences="9" value="w_" /> + <ngram occurrences="9" value="u_r" /> + <ngram occurrences="9" value="st" /> + <ngram occurrences="9" value="sg" /> + <ngram occurrences="9" value="os" /> + <ngram occurrences="9" value="og" /> + <ngram occurrences="9" value="oedd_" /> + <ngram occurrences="9" value="od_" /> + <ngram occurrences="9" value="new" /> + <ngram occurrences="9" value="na" /> + <ngram occurrences="9" value="mewn_" /> + <ngram occurrences="9" value="mewn" /> + <ngram occurrences="9" value="mew" /> + <ngram occurrences="9" value="il" /> + <ngram occurrences="9" value="ig_" /> + <ngram occurrences="9" value="gwe" /> + <ngram occurrences="9" value="fy" /> + <ngram occurrences="9" value="fer" /> + <ngram occurrences="9" value="ewn_" /> + <ngram occurrences="9" value="edd_" /> + <ngram occurrences="9" value="dy" /> + <ngram occurrences="9" value="dr" /> + <ngram occurrences="9" value="dio_" /> + <ngram occurrences="9" value="ddio_" /> + <ngram occurrences="9" value="d_i" /> + <ngram occurrences="9" value="d_a" /> + <ngram occurrences="9" value="_sy" /> + <ngram occurrences="9" value="_si" /> + <ngram occurrences="9" value="_pa" /> + <ngram occurrences="9" value="_new" /> + <ngram occurrences="9" value="_mewn" /> + <ngram occurrences="9" value="_mew" /> + <ngram occurrences="9" value="_ma" /> + <ngram occurrences="9" value="_ga" /> + <ngram occurrences="9" value="_ac_" /> + <ngram occurrences="8" value="so" /> + <ngram occurrences="8" value="r_gym" /> + <ngram occurrences="8" value="par" /> + <ngram occurrences="8" value="or" /> + <ngram occurrences="8" value="nt_" /> + <ngram occurrences="8" value="my" /> + <ngram occurrences="8" value="ly" /> + <ngram occurrences="8" value="lw" /> + <ngram occurrences="8" value="l_i_" /> + <ngram occurrences="8" value="l_a" /> + <ngram occurrences="8" value="is" /> + <ngram occurrences="8" value="in" /> + <ngram occurrences="8" value="id_" /> + <ngram occurrences="8" value="iad" /> + <ngram occurrences="8" value="hr" /> + <ngram occurrences="8" value="he" /> + <ngram occurrences="8" value="ge" /> + <ngram occurrences="8" value="g_yn_" /> + <ngram occurrences="8" value="g_yn" /> + <ngram occurrences="8" value="eg_y" /> + <ngram occurrences="8" value="e_" /> + <ngram occurrences="8" value="dia" /> + <ngram occurrences="8" value="dd_yn" /> + <ngram occurrences="8" value="d_e" /> + <ngram occurrences="8" value="cyf" /> + <ngram occurrences="8" value="_rh" /> + <ngram occurrences="8" value="_gwe" /> + <ngram occurrences="8" value="_eu_" /> + <ngram occurrences="8" value="_eu" /> + <ngram occurrences="8" value="_cyf" /> + <ngram occurrences="7" value="yr_a" /> + <ngram occurrences="7" value="yg" /> + <ngram occurrences="7" value="yddo" /> + <ngram occurrences="7" value="ydd_y" /> + <ngram occurrences="7" value="y_n" /> + <ngram occurrences="7" value="y_gym" /> + <ngram occurrences="7" value="y_gy" /> + <ngram occurrences="7" value="y_c" /> + <ngram occurrences="7" value="u_y" /> + <ngram occurrences="7" value="u_r_" /> + <ngram occurrences="7" value="tr" /> + <ngram occurrences="7" value="ta" /> + <ngram occurrences="7" value="s_y" /> + <ngram occurrences="7" value="rw" /> + <ngram occurrences="7" value="rth_" /> + <ngram occurrences="7" value="rdd" /> + <ngram occurrences="7" value="r_i" /> + <ngram occurrences="7" value="r_ar" /> + <ngram occurrences="7" value="ol_a" /> + <ngram occurrences="7" value="odol_" /> + <ngram occurrences="7" value="odol" /> + <ngram occurrences="7" value="odo" /> + <ngram occurrences="7" value="odd" /> + <ngram occurrences="7" value="ob" /> + <ngram occurrences="7" value="o_a" /> + <ngram occurrences="7" value="nol" /> + <ngram occurrences="7" value="newyd" /> + <ngram occurrences="7" value="newy" /> + <ngram occurrences="7" value="n_h" /> + <ngram occurrences="7" value="n_g" /> + <ngram occurrences="7" value="n_f" /> + <ngram occurrences="7" value="n_c" /> + <ngram occurrences="7" value="m_" /> + <ngram occurrences="7" value="ll_" /> + <ngram occurrences="7" value="ic" /> + <ngram occurrences="7" value="iad_" /> + <ngram occurrences="7" value="i_g" /> + <ngram occurrences="7" value="han" /> + <ngram occurrences="7" value="gu" /> + <ngram occurrences="7" value="gan" /> + <ngram occurrences="7" value="fl" /> + <ngram occurrences="7" value="fer_" /> + <ngram occurrences="7" value="ewydd" /> + <ngram occurrences="7" value="ewyd" /> + <ngram occurrences="7" value="ewy" /> + <ngram occurrences="7" value="ent" /> + <ngram occurrences="7" value="du" /> + <ngram occurrences="7" value="di_" /> + <ngram occurrences="7" value="ddefn" /> +</ngrams>