blob: 107b1901ff51c1d0ba26225a6c13067df0c71edb [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.metron.parsers.csv;
import static org.hamcrest.CoreMatchers.equalTo;
import static org.hamcrest.MatcherAssert.assertThat;
import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertNull;
import static org.junit.jupiter.api.Assertions.assertThrows;
import static org.junit.jupiter.api.Assertions.assertTrue;
import java.io.IOException;
import java.nio.charset.StandardCharsets;
import java.util.List;
import org.adrianwalker.multilinestring.Multiline;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.log4j.Level;
import org.apache.metron.common.configuration.SensorParserConfig;
import org.apache.metron.common.utils.JSONUtils;
import org.apache.metron.parsers.interfaces.MessageParser;
import org.apache.metron.test.utils.UnitTestHelper;
import org.json.simple.JSONObject;
import org.junit.jupiter.api.Test;
/**
 * Unit tests for {@link CSVParser}.
 *
 * <p>Covers mapping of comma-separated values onto the configured column names
 * (including whitespace around column names and values), lines that yield no
 * message, a line the parser rejects, and resolution of the read charset.
 */
public class CSVParserTest {

  // NOTE: the Javadoc-style block below is test data, not documentation. The
  // @Multiline annotation is expected to inject its text into parserConfig, which
  // the tests then load as JSON. The padding inside the " col2" and "col3 " keys is
  // deliberate: test() asserts that the padded names are absent from parsed messages.
  /**
  {
  "parserClassName" : "org.apache.metron.parsers.csv.CSVParser"
  ,"sensorTopic":"dummy"
  ,"parserConfig":
  {
  "columns" : {
  "col1" : 0
  ," col2" : 1
  ,"col3 " : 2
  }
  }
  }
  */
  @Multiline
  public static String parserConfig;

  /**
   * Exercises {@link CSVParser#parse} against comment lines, empty lines, plain,
   * quoted and whitespace-padded values, and a line that the parser rejects.
   *
   * @throws IOException if the JSON parser configuration cannot be loaded
   */
  @Test
  public void test() throws IOException {
    CSVParser parser = new CSVParser();
    SensorParserConfig config = JSONUtils.INSTANCE.load(parserConfig, SensorParserConfig.class);
    parser.init();
    parser.configure(config.getParserConfig());

    // A line starting with '#' and an empty line must both yield no messages.
    assertEquals(0, parser.parse(Bytes.toBytes("#foo,bar,grok")).size());
    assertEquals(0, parser.parse(Bytes.toBytes("")).size());

    // Plain values, quoted values, and values with leading whitespace all map
    // onto the same three columns.
    assertParsesToFooBarGrok(parser, "foo,bar,grok");
    assertParsesToFooBarGrok(parser, "\"foo\", \"bar\",\"grok\"");
    assertParsesToFooBarGrok(parser, "foo, bar, grok");

    // Whitespace on both sides of the values; additionally the column names must
    // be the trimmed ones, not the padded keys from the configuration.
    JSONObject padded = assertParsesToFooBarGrok(parser, " foo , bar , grok ");
    assertNull(padded.get(" col2"));
    assertNull(padded.get("col3 "));

    // A single-value line is rejected. The parser's logger is quietened for the
    // expected failure; the finally block guarantees the level is put back even if
    // the assertion fails, so later tests in the same JVM are not affected.
    UnitTestHelper.setLog4jLevel(CSVParser.class, Level.FATAL);
    try {
      String line = "foo";
      assertThrows(IllegalStateException.class, () -> parser.parse(Bytes.toBytes(line)));
    } finally {
      UnitTestHelper.setLog4jLevel(CSVParser.class, Level.ERROR);
    }
  }

  /**
   * Parses {@code line} and asserts that it produces exactly one valid message whose
   * {@code col1}, {@code col2} and {@code col3} fields are {@code foo}, {@code bar}
   * and {@code grok}.
   *
   * @param parser an initialised and configured parser
   * @param line the raw CSV line to parse
   * @return the single parsed message, so callers can make further assertions on it
   * @throws IOException declared only so the helper mirrors the signature of the
   *     calling test; the calls made here are not known to raise it
   */
  private static JSONObject assertParsesToFooBarGrok(CSVParser parser, String line)
      throws IOException {
    List<JSONObject> results = parser.parse(Bytes.toBytes(line));
    assertEquals(1, results.size());
    JSONObject message = results.get(0);
    assertTrue(parser.validate(message));
    // Three mapped columns plus two further fields added by the parser
    // (presumably original_string and timestamp -- TODO confirm against CSVParser).
    assertEquals(5, message.size());
    assertEquals("foo", message.get("col1"));
    assertEquals("bar", message.get("col2"));
    assertEquals("grok", message.get("col3"));
    return message;
  }

  /**
   * Verifies that a charset supplied under {@link MessageParser#READ_CHARSET} in the
   * parser configuration is the one reported by {@code getReadCharset()}.
   *
   * @throws IOException if the JSON parser configuration cannot be loaded
   */
  @Test
  public void getsReadCharsetFromConfig() throws IOException {
    SensorParserConfig config = JSONUtils.INSTANCE.load(parserConfig, SensorParserConfig.class);
    CSVParser parser = new CSVParser();
    parser.init();
    config.getParserConfig().put(MessageParser.READ_CHARSET, StandardCharsets.UTF_16.toString());
    parser.configure(config.getParserConfig());
    assertThat(parser.getReadCharset(), equalTo(StandardCharsets.UTF_16));
  }

  /**
   * Verifies that {@code getReadCharset()} reports UTF-8 when the parser
   * configuration does not specify a read charset.
   *
   * @throws IOException if the JSON parser configuration cannot be loaded
   */
  @Test
  public void getsReadCharsetFromDefault() throws IOException {
    SensorParserConfig config = JSONUtils.INSTANCE.load(parserConfig, SensorParserConfig.class);
    CSVParser parser = new CSVParser();
    parser.init();
    parser.configure(config.getParserConfig());
    assertThat(parser.getReadCharset(), equalTo(StandardCharsets.UTF_8));
  }
}