| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.stanbol.enhancer.engines.langid.core; |
| |
| import static junit.framework.Assert.assertEquals; |
| import static org.junit.Assert.assertEquals; |
| import static org.junit.Assert.assertNotNull; |
| |
| import java.io.IOException; |
| import java.io.InputStream; |
| |
| import org.apache.commons.io.IOUtils; |
| import org.apache.tika.language.LanguageIdentifier; |
| import org.junit.BeforeClass; |
| import org.junit.Test; |
| |
| /** |
| * {@link LangIdTest} is a test class for {@link TextCategorizer}. |
| * |
| * @author Joerg Steffen, DFKI |
| * @version $Id$ |
| */ |
| public class LangIdTest { |
| |
| private static final String TEST_FILE_NAME = "en.txt"; |
| /** |
| * This contains the text used for testing |
| */ |
| private static String text; |
| /** |
| * This initializes the text categorizer. |
| */ |
| @BeforeClass |
| public static void oneTimeSetUp() throws IOException { |
| LanguageIdentifier.initProfiles(); |
| InputStream in = LangIdTest.class.getClassLoader().getResourceAsStream( |
| TEST_FILE_NAME); |
| assertNotNull("failed to load resource " + TEST_FILE_NAME, in); |
| text = IOUtils.toString(in); |
| } |
| |
| /** |
| * Tests the language identification. |
| * |
| * @throws IOException if there is an error when reading the text |
| */ |
| @Test |
| public void testLangId() throws IOException { |
| LanguageIdentifier tc = new LanguageIdentifier(text); |
| String language = tc.getLanguage(); |
| assertEquals("en", language); |
| } |
| } |