| # Copyright (c) 2003, WiseGuys Internet B.V. |
| # |
| # All rights reserved. |
| # |
| # Redistribution and use in source and binary forms, with or without |
| # modification, are permitted provided that the following conditions are |
| # met: |
| # |
| # - Redistributions of source code must retain the above copyright |
| # notice, this list of conditions and the following disclaimer. |
| # |
| # - Redistributions in binary form must reproduce the above copyright |
| # notice, this list of conditions and the following disclaimer in the |
| # documentation and/or other materials provided with the distribution. |
| # |
| # - Neither the name of the WiseGuys Internet B.V. nor the names of its |
| # contributors may be used to endorse or promote products derived from |
| # this software without specific prior written permission. |
| # |
| # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| # |
| |
| # A sample config file for the language models |
| # provided with Gertjan van Noord's language guesser |
| # (http://odur.let.rug.nl/~vannoord/TextCat/) |
| # |
| # Notes: |
| # - You may consider eliminating a couple of small languages from this |
| # list because they cause false positives with big languages and are |
| # bad for performance. (Do you really want to recognize Drents?) |
| # - Putting the most probable languages at the top of the list |
| # improves performance, because this will raise the threshold for |
| # likely candidates more quickly. |
| # |
| |
| # This file has been modified (for OOo, by Jocelyn MERAND, |
| # joc.merATgmail.com) to include country and encoding. |
| # Guess strings are formed as follows: language-country-encoding |
| |
| afrikaans.lm af--utf8 |
| albanian.lm sq--utf8 |
| amharic_utf.lm am--utf8 |
| arabic.lm ar--utf8 |
| basque.lm eu--utf8 |
| belarus.lm be--utf8 |
| bosnian.lm bs--utf8 |
| breton.lm br--utf8 |
| catalan.lm ca--utf8 |
| chinese_simplified.lm zh-CN-utf8 |
| chinese_traditional.lm zh-TW-utf8 |
| croatian.lm hr--utf8 |
| czech.lm cs--utf8 |
| danish.lm da--utf8 |
| dutch.lm nl--utf8 |
| english.lm en--utf8 |
| esperanto.lm eo--utf8 |
| estonian.lm et--utf8 |
| finnish.lm fi--utf8 |
| french.lm fr--utf8 |
| frisian.lm fy--utf8 |
| georgian.lm ka--utf8 |
| german.lm de--utf8 |
| greek.lm el--utf8 |
| hebrew.lm he--utf8 |
| hindi.lm hi--utf8 |
| hungarian.lm hu--utf8 |
| icelandic.lm is--utf8 |
| indonesian.lm id--utf8 |
| irish_gaelic.lm ga--utf8 |
| italian.lm it--utf8 |
| japanese.lm ja--utf8 |
| korean.lm ko--utf8 |
| latin.lm la--utf8 |
| latvian.lm lv--utf8 |
| lithuanian.lm lt--utf8 |
| luxembourgish.lm lb--utf8 |
| malay.lm ms--utf8 |
| manx_gaelic.lm gv--utf8 |
| marathi.lm mr--utf8 |
| mongolian_cyrillic.lm mn--utf8 |
| nepali.lm ne--utf8 |
| norwegian.lm nb--utf8 # Norwegian (Bokmal) |
| persian.lm fa--utf8 # Farsi |
| polish.lm pl--utf8 |
| portuguese.lm pt-PT-utf8 |
| quechua.lm qu--utf8 |
| romanian.lm ro--utf8 |
| romansh.lm rm--utf8 |
| russian.lm ru--utf8 |
| sanskrit.lm sa--utf8 |
| scots.lm sco--utf8 |
| scots_gaelic.lm gd--utf8 |
| serbian.lm sr--utf8 |
| serbian-latin.lm sh--utf8 |
| slovak_ascii.lm sk-SK-utf8 |
| slovenian.lm sl--utf8 |
| spanish.lm es--utf8 |
| swahili.lm sw--utf8 |
| swedish.lm sv--utf8 |
| tagalog.lm tl--utf8 |
| tamil.lm ta--utf8 |
| thai.lm th--utf8 |
| turkish.lm tr--utf8 |
| ukrainian.lm uk--utf8 |
| vietnamese.lm vi--utf8 |
| welsh.lm cy--utf8 |
| yiddish_utf.lm yi--utf8 |
| zulu.lm zu--utf8 |