| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118 |
- # Copyright (c) 2003, WiseGuys Internet B.V.
- #
- # All rights reserved.
- #
- # Redistribution and use in source and binary forms, with or without
- # modification, are permitted provided that the following conditions are
- # met:
- #
- # - Redistributions of source code must retain the above copyright
- # notice, this list of conditions and the following disclaimer.
- #
- # - Redistributions in binary form must reproduce the above copyright
- # notice, this list of conditions and the following disclaimer in the
- # documentation and/or other materials provided with the distribution.
- #
- # - Neither the name of the WiseGuys Internet B.V. nor the names of its
- # contributors may be used to endorse or promote products derived from
- # this software without specific prior written permission.
- #
- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
- # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- #
- # A sample config file for the language models
- # provided with Gertjan van Noord's language guesser
- # (http://odur.let.rug.nl/~vannoord/TextCat/)
- #
- # Notes:
- # - You may consider eliminating a couple of small languages from this
- # list because they cause false positives with big languages and are
- # bad for performance. (Do you really want to recognize Drents?)
- # - Putting the most probable languages at the top of the list
- # improves performance, because this will raise the threshold for
- # likely candidates more quickly.
- #
- # This file has been modified (for OOo, by Jocelyn MERAND,
- # joc.merATgmail.com) to include country and encoding.
- # Guess strings have the following form: language-country-encoding
- afrikaans.lm af--utf8
- albanian.lm sq--utf8
- amharic_utf.lm am--utf8
- arabic.lm ar--utf8
- basque.lm eu--utf8
- belarus.lm be--utf8
- bosnian.lm bs--utf8
- breton.lm br--utf8
- catalan.lm ca--utf8
- chinese_simplified.lm zh-CN-utf8
- chinese_traditional.lm zh-TW-utf8
- croatian.lm hr--utf8
- czech.lm cs--utf8
- danish.lm da--utf8
- dutch.lm nl--utf8
- english.lm en--utf8
- esperanto.lm eo--utf8
- estonian.lm et--utf8
- finnish.lm fi--utf8
- french.lm fr--utf8
- frisian.lm fy--utf8
- georgian.lm ka--utf8
- german.lm de--utf8
- greek.lm el--utf8
- hebrew.lm he--utf8
- hindi.lm hi--utf8
- hungarian.lm hu--utf8
- icelandic.lm is--utf8
- indonesian.lm id--utf8
- irish_gaelic.lm ga--utf8
- italian.lm it--utf8
- japanese.lm ja--utf8
- korean.lm ko--utf8
- latin.lm la--utf8
- latvian.lm lv--utf8
- lithuanian.lm lt--utf8
- luxembourgish.lm lb--utf8
- malay.lm ms--utf8
- manx_gaelic.lm gv--utf8
- marathi.lm mr--utf8
- mongolian_cyrillic.lm mn--utf8
- nepali.lm ne--utf8
- norwegian.lm nb--utf8 # Norwegian (Bokmal)
- persian.lm fa--utf8 # Farsi
- polish.lm pl--utf8
- portuguese.lm pt-PT-utf8
- quechua.lm qu--utf8
- romanian.lm ro--utf8
- romansh.lm rm--utf8
- russian.lm ru--utf8
- sanskrit.lm sa--utf8
- scots.lm sco--utf8
- scots_gaelic.lm gd--utf8
- serbian.lm sr--utf8
- serbian-latin.lm sh--utf8
- slovak_ascii.lm sk-SK-utf8
- slovenian.lm sl--utf8
- spanish.lm es--utf8
- swahili.lm sw--utf8
- swedish.lm sv--utf8
- tagalog.lm tl--utf8
- tamil.lm ta--utf8
- thai.lm th--utf8
- turkish.lm tr--utf8
- ukrainian.lm uk--utf8
- vietnamese.lm vi--utf8
- welsh.lm cy--utf8
- yiddish_utf.lm yi--utf8
- zulu.lm zu--utf8
|