blob: 18ca861937190df881551f82ad7a7e3e463b05c5 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.store.easy.json.loader;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;
import static org.junit.Assert.fail;
import java.nio.charset.StandardCharsets;
import java.time.Instant;
import java.time.LocalDate;
import java.time.LocalDateTime;
import java.time.LocalTime;
import java.time.ZoneId;
import java.time.format.DateTimeFormatter;
import java.util.TimeZone;
import static org.apache.drill.test.rowSet.RowSetUtilities.dec;
import static org.apache.drill.test.rowSet.RowSetUtilities.mapValue;
import static org.apache.drill.test.rowSet.RowSetUtilities.longArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.intArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.decArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.doubleArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.binArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.strArray;
import static org.apache.drill.test.rowSet.RowSetUtilities.objArray;
import org.apache.drill.categories.JsonTest;
import org.apache.drill.common.exceptions.UserException;
import org.apache.drill.common.types.TypeProtos.MinorType;
import org.apache.drill.exec.physical.rowSet.RowSet;
import org.apache.drill.exec.record.metadata.SchemaBuilder;
import org.apache.drill.exec.record.metadata.TupleMetadata;
import org.apache.drill.test.rowSet.RowSetUtilities;
import org.junit.Test;
import org.junit.experimental.categories.Category;
/**
 * Tests the JSON loader with {@code enableExtendedTypes} turned on.
 * <p>
 * Most tests feed arrays whose elements use Mongo-style extended type
 * syntax ({@code $numberInt}, {@code $numberLong}, {@code $numberDecimal},
 * {@code $numberDouble}, {@code $date}, {@code $binary}, {@code $oid}) and
 * compare the first batch against an expected row set. Despite the class
 * name, a few tests ({@link #testDateDay()}, {@link #testTime()},
 * {@link #testInterval()}) exercise scalar columns, and the final group
 * checks the error raised for malformed extended values.
 * <p>
 * Every test closes its loader in a {@code finally} block so that a failed
 * assertion does not leave the loader open.
 * NOTE(review): this assumes {@code JsonLoaderFixture.close()} is safe to
 * call after {@code next()} has thrown - confirm against the fixture.
 */
@Category(JsonTest.class)
public class TestExtendedArrays extends BaseJsonLoaderTest {

  /**
   * Fragment the error tests expect to find in the message of the
   * {@link UserException} raised for a malformed {@code $numberLong} value.
   */
  private static final String LONG_HINT = "<{\"$numberLong\": scalar}>";

  /**
   * Creates a loader fixture with extended types enabled and opens it on
   * the given JSON text. The caller is responsible for closing the result.
   *
   * @param json the JSON text to load
   * @return the opened loader fixture
   */
  private JsonLoaderFixture openExtended(String json) {
    JsonLoaderFixture loader = new JsonLoaderFixture();
    loader.jsonOptions.enableExtendedTypes = true;
    loader.open(json);
    return loader;
  }

  /**
   * Loads the given JSON with extended types enabled and asserts that
   * reading the first batch throws a {@link UserException} whose message
   * contains {@code expectedFragment}.
   *
   * @param json the JSON text expected to fail
   * @param expectedFragment text that must appear in the error message
   */
  private void expectError(String json, String expectedFragment) {
    JsonLoaderFixture loader = openExtended(json);
    try {
      loader.next();
      fail("Expected a UserException containing: " + expectedFragment);
    } catch (UserException e) {
      assertTrue("Unexpected error message: " + e.getMessage(),
          e.getMessage().contains(expectedFragment));
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $numberInt} values. A null array and an empty array are
   * both expected as an empty array; a null element is expected as 0.
   */
  @Test
  public void testInt() {
    String json =
        "{ a: [ { \"$numberInt\": 10 }, 20, { \"$numberInt\": \"30\" } ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        "{ a: [ { \"$numberInt\": 40 }, \"50\", null ] }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.INT)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(intArray(10, 20, 30))
          .addSingleCol(intArray())
          .addSingleCol(intArray())
          .addSingleCol(intArray(40, 50, 0))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $numberLong} values, with the same null and empty
   * expectations as {@link #testInt()}.
   */
  @Test
  public void testLong() {
    String json =
        "{ a: [ { \"$numberLong\": 10 }, 20, { \"$numberLong\": \"30\" } ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        "{ a: [ { \"$numberLong\": 40 }, \"50\", null ] }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.BIGINT)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(longArray(10L, 20L, 30L))
          .addSingleCol(longArray())
          .addSingleCol(longArray())
          .addSingleCol(longArray(40L, 50L, 0L))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $numberDecimal} values given as integers, floats and
   * strings; a null element is expected as decimal 0.
   */
  @Test
  public void testDecimal() {
    String json =
        "{ a: [ { \"$numberDecimal\": 10 }, null, { \"$numberDecimal\": \"30\" }, " +
        " { \"$numberDecimal\": 40.2345 } ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        "{ a: [ 60, \"70.890\", 80.765 ] }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.VARDECIMAL, 38, 10)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(decArray(dec("10"), dec("0"), dec("30"), dec("40.2345")))
          .addSingleCol(decArray())
          .addSingleCol(decArray())
          .addSingleCol(decArray(dec("60"), dec("70.89"), dec("80.765")))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $numberDouble} values, including the string forms
   * {@code "-Infinity"}, {@code "Infinity"} and {@code "NaN"}.
   */
  @Test
  public void testDouble() {
    String json =
        "{ a: [ { \"$numberDouble\": 10 }, null, { \"$numberDouble\": \"30\" } ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        "{ a: [ { \"$numberDouble\": 40.125 }, 60, \"70.125\", 80.375 ] }\n" +
        "{ a: [ { \"$numberDouble\": \"-Infinity\" }, " +
        " { \"$numberDouble\": \"Infinity\" }," +
        " { \"$numberDouble\": \"NaN\" } ] }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.FLOAT8)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(doubleArray(10D, 0D, 30D))
          .addSingleCol(doubleArray())
          .addSingleCol(doubleArray())
          .addSingleCol(doubleArray(40.125D, 60D, 70.125D, 80.375D))
          .addSingleCol(doubleArray(Double.NEGATIVE_INFINITY, Double.POSITIVE_INFINITY, Double.NaN))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $date} values in several encodings: ISO string,
   * epoch-millis number, nested {@code $numberLong}, and bare values.
   * The expected timestamp is the epoch-millis value plus the default
   * time zone's offset at that instant.
   */
  @Test
  public void testDate() {
    LocalDateTime local = LocalDateTime.of(2020, 4, 21, 11, 22, 33);
    Instant instant = local.atZone(ZoneId.systemDefault()).toInstant();
    long ts = instant.toEpochMilli();
    String utc = DateTimeFormatter.ISO_INSTANT.format(instant);
    long localTs = ts + TimeZone.getDefault().getOffset(ts);
    String json =
        // V1 string, V2 relaxed
        "{ a: [ { \"$date\": \"" + utc + "\" },\n" +
        // V1 "shell mode"
        " { \"$date\": " + ts + " } ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        // V2 canonical
        "{ a: [ { \"$date\": { \"$numberLong\": " + ts + " } },\n" +
        // Harmless extensions, only valid after the above
        " " + ts + ",\n" +
        " \"" + utc + "\" ] }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.TIMESTAMP)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(longArray(localTs, localTs))
          .addSingleCol(longArray())
          .addSingleCol(longArray())
          .addSingleCol(longArray(localTs, localTs, localTs))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * A null element inside a {@code $date} array is expected to be rejected
   * with a "does not allow null values" error.
   */
  @Test
  public void testDateNull() {
    LocalDateTime local = LocalDateTime.of(2020, 4, 21, 11, 22, 33);
    Instant instant = local.atZone(ZoneId.systemDefault()).toInstant();
    String utc = DateTimeFormatter.ISO_INSTANT.format(instant);
    String json =
        "{ a: [ { \"$date\": \"" + utc + "\" }, null ] }\n";
    expectError(json, "does not allow null values");
  }

  /**
   * Array of {@code $binary} values in V1 and V2 formats; a null element
   * is expected as an empty byte array.
   */
  @Test
  public void testBinary() {
    String json =
        // V2 format
        "{ a: [ { \"$binary\": { base64: \"ZHJpbGw=\", subType: \"0\" } },\n" +
        " { \"$binary\": { subType: \"0\", base64: \"ZHJpbGw=\" } },\n" +
        // Harmless extension
        " { \"$binary\": { base64: \"ZHJpbGw=\" } }, null ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        // V1 format
        "{ a: [ { \"$binary\": \"ZHJpbGw=\", \"$type\": 1 },\n" +
        // Harmless extension
        " { \"$binary\": \"ZHJpbGw=\" },\n" +
        // Only valid after the above
        " \"ZHJpbGw=\" ] }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.VARBINARY)
          .build();
      // "ZHJpbGw=" is the Base64 encoding of the bytes of lowercase "drill"
      // (0x64 0x72 0x69 0x6C 0x6C), so the expected value must be lowercase.
      // NOTE(review): presumes the loader Base64-decodes the payload - confirm.
      byte[] bytes = "drill".getBytes(StandardCharsets.UTF_8);
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(binArray(bytes, bytes, bytes, new byte[] { }))
          .addSingleCol(binArray())
          .addSingleCol(binArray())
          .addSingleCol(binArray(bytes, bytes, bytes))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Array of {@code $oid} values, expected as strings; a null element is
   * expected as an empty string.
   */
  @Test
  public void testObjectID() {
    String json =
        "{ a: [ { \"$oid\": \"foo\" },\n" +
        // Harmless extension. A real OID can't be a "blank"
        // value, but here we just store it as a string.
        " null ] }\n" +
        "{ a: null }\n" +
        "{ a: [] }\n" +
        // Only valid after the above
        "{ a: [ \"foo\" ] }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addArray("a", MinorType.VARCHAR)
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(strArray("foo", ""))
          .addSingleCol(strArray())
          .addSingleCol(strArray())
          .addSingleCol(strArray("foo"))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * A Mongo document is just a regular JSON map: an array of maps whose
   * members may themselves use extended types. A null map element is
   * expected as a map with all-null members.
   */
  @Test
  public void testDocument() {
    String json =
        "{ m: [ { a: { \"$numberLong\": 10 }, b: \"foo\" },\n" +
        " { a: { \"$numberLong\": \"20\" }, b: null },\n" +
        " { a: 30 } ] }\n" +
        // Harmless extension
        "{ m: null }\n" +
        "{ m: [] }\n" +
        "{ m: [ null, { a: { \"$numberLong\": 40 }, b: \"bar\" } ] }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addMapArray("m")
            .addNullable("a", MinorType.BIGINT)
            .addNullable("b", MinorType.VARCHAR)
            .resumeSchema()
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(objArray(mapValue(10L, "foo"),
              mapValue(20L, null), mapValue(30L, null)))
          .addSingleCol(objArray())
          .addSingleCol(objArray())
          .addSingleCol(objArray(mapValue(null, null), mapValue(40L, "bar")))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Drill extension: date only ({@code $dateDay}), as a nullable scalar.
   */
  @Test
  public void testDateDay() {
    String json =
        "{ a: { \"$dateDay\": \"2020-04-21\" } }\n" +
        "{ a: null }\n" +
        "{ a: \"2020-04-21\" }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addNullable("a", MinorType.DATE)
          .build();
      // Decimal month literal: a leading zero would make it an octal literal.
      LocalDate date = LocalDate.of(2020, 4, 21);
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addRow(date)
          .addSingleCol(null)
          .addRow(date)
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Drill extension: time only ({@code $time}), as a nullable scalar.
   */
  @Test
  public void testTime() {
    String json =
        "{ a: { \"$time\": \"11:22:33\" } }\n" +
        "{ a: null }\n" +
        "{ a: \"11:22:33\" }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addNullable("a", MinorType.TIME)
          .build();
      LocalTime time = LocalTime.of(11, 22, 33);
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addRow(time)
          .addSingleCol(null)
          .addRow(time)
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Drill extension: time interval ({@code $interval}), as a nullable
   * scalar, given in full, date-only and time-only forms.
   */
  @Test
  public void testInterval() {
    String json =
        "{ a: { \"$interval\": \"P1Y2M3DT4H5M6S\" } }\n" +
        "{ a: { \"$interval\": \"P1Y2M3D\" } }\n" +
        "{ a: { \"$interval\": \"PT4H5M6S\" } }\n" +
        "{ a: null }\n" +
        "{ a: \"P1Y2M3DT4H5M6S\" }\n" +
        "{ a: \"P1Y2M3D\" }\n" +
        "{ a: \"PT4H5M6S\" }\n";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addNullable("a", MinorType.INTERVAL)
          .build();
      org.joda.time.Period full = org.joda.time.Period.years(1).withMonths(2).withDays(3).withHours(4).withMinutes(5).withSeconds(6);
      org.joda.time.Period ymd = org.joda.time.Period.years(1).withMonths(2).withDays(3);
      org.joda.time.Period hms = org.joda.time.Period.hours(4).withMinutes(5).withSeconds(6);
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addRow(full)
          .addRow(ymd)
          .addRow(hms)
          .addSingleCol(null)
          .addRow(full)
          .addRow(ymd)
          .addRow(hms)
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * Ordinary values and maps (no {@code $}-prefixed keys) are expected to
   * load as regular columns and maps even with extended types enabled.
   */
  @Test
  public void testNonExtended() {
    String json =
        "{ a: 10, b: { }, c: { d: 30 } }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addNullable("a", MinorType.BIGINT)
          .addMap("b")
            .resumeSchema()
          .addMap("c")
            .addNullable("d", MinorType.BIGINT)
            .resumeSchema()
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addRow(10, mapValue(), mapValue(30))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /**
   * An unrecognized {@code $}-prefixed key is expected to be treated as an
   * ordinary map member named {@code $bogus}.
   */
  @Test
  public void testUnknownType() {
    String json =
        "{ a: { \"$bogus\": 10 } }";
    JsonLoaderFixture loader = openExtended(json);
    try {
      RowSet results = loader.next();
      assertNotNull(results);
      TupleMetadata expectedSchema = new SchemaBuilder()
          .addMap("a")
            .addNullable("$bogus", MinorType.BIGINT)
            .resumeSchema()
          .build();
      RowSet expected = fixture.rowSetBuilder(expectedSchema)
          .addSingleCol(mapValue(10))
          .build();
      RowSetUtilities.verify(expected, results);
      assertNull(loader.next());
    } finally {
      loader.close();
    }
  }

  /** An array where a {@code $numberLong} object was seen earlier must fail. */
  @Test
  public void testInvalidTypeToken() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: [ ] }";
    expectError(json, LONG_HINT);
  }

  /** An empty object where a {@code $numberLong} object was seen earlier must fail. */
  @Test
  public void testInvalidTypeObject() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: { } }";
    expectError(json, LONG_HINT);
  }

  /** A different type key where {@code $numberLong} was seen earlier must fail. */
  @Test
  public void testInvalidTypeName() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: { \"$bogus\": 20 } }";
    expectError(json, LONG_HINT);
  }

  /** A non-scalar token as the {@code $numberLong} value must fail. */
  @Test
  public void testInvalidValueToken() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: { \"$numberLong\": [ ] } }";
    expectError(json, LONG_HINT);
  }

  /** A floating-point number as the {@code $numberLong} value must fail. */
  @Test
  public void testInvalidValue() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: { \"$numberLong\": 20.3 } }";
    expectError(json, "Unexpected JSON value: VALUE_NUMBER_FLOAT");
  }

  /** An extra member alongside {@code $numberLong} must fail. */
  @Test
  public void testExtraField() {
    String json =
        "{ a: { \"$numberLong\": 10 } }\n" +
        "{ a: { \"$numberLong\": 20, bogus: 30 } }";
    expectError(json, LONG_HINT);
  }
}