blob: 45cafbfd122baa597e56533288eadcc5db313f7e [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jena.riot.lang;
import static org.apache.jena.riot.system.ErrorHandlerFactory.errorHandlerNoLogging ;
import static org.apache.jena.riot.system.ErrorHandlerFactory.getDefaultErrorHandler ;
import static org.apache.jena.riot.system.ErrorHandlerFactory.setDefaultErrorHandler ;
import static org.junit.Assert.assertEquals;
import java.io.ByteArrayInputStream ;
import org.apache.jena.atlas.lib.CharSpace ;
import org.apache.jena.atlas.lib.StrUtils ;
import org.apache.jena.irix.IRIs;
import org.apache.jena.riot.ErrorHandlerTestLib.ErrorHandlerEx;
import org.apache.jena.riot.ErrorHandlerTestLib.ExError;
import org.apache.jena.riot.ErrorHandlerTestLib.ExFatal;
import org.apache.jena.riot.ErrorHandlerTestLib.ExWarning;
import org.apache.jena.riot.Lang ;
import org.apache.jena.riot.RIOT;
import org.apache.jena.riot.system.*;
import org.apache.jena.riot.tokens.Tokenizer ;
import org.apache.jena.riot.tokens.TokenizerText;
import org.junit.AfterClass ;
import org.junit.BeforeClass ;
import org.junit.Test ;
/** Test of syntax by a tuples parser (does not include node validity checking) */
abstract public class AbstractTestLangNTuples
{
// Test streaming interface.
private static ErrorHandler errorhandler = null;
@BeforeClass
public static void beforeClass() {
errorhandler = getDefaultErrorHandler();
setDefaultErrorHandler(errorHandlerNoLogging);
}
@AfterClass
public static void afterClass() {
setDefaultErrorHandler(errorhandler);
}
@Test
public void tuple_0() {
long count = parseCount("");
assertEquals(0, count);
}
@Test
public void tuple_1() {
long count = parseCount("<x> <y> <z>.");
assertEquals(1, count);
}
@Test
public void tuple_2() {
long count = parseCount("<x> <y> \"z\".");
assertEquals(1, count);
}
@Test
public void tuple_3() {
long count = parseCount("<x> <y> <z>. <x> <y> <z>.");
assertEquals(2, count);
}
@Test
public void tuple_4() {
long count = parseCount("<x> <y> \"123\"^^<int>.");
assertEquals(1, count);
}
@Test
public void tuple_5() {
long count = parseCount("<x> <y> \"123\"@lang.");
assertEquals(1, count);
}
// Test parse errors interface.
@Test(expected = ExFatal.class)
public void tuple_bad_01() {
parseCount("<x> <y> <z>"); // No DOT
}
@Test(expected = ExFatal.class)
public void tuple_bad_02() {
parseCount("<x> _:a <z> ."); // Bad predicate
}
@Test(expected = ExFatal.class)
public void tuple_bad_03() {
parseCount("<x> \"p\" <z> ."); // Bad predicate
}
@Test(expected = ExFatal.class)
public void tuple_bad_4() {
parseCount("\"x\" <p> <z> ."); // Bad subject
}
@Test(expected = ExFatal.class)
public void tuple_bad_5() {
parseCount("<x> <p> ?var ."); // No variables
}
@Test(expected = ExFatal.class)
public void tuple_bad_6() {
parseCount("<x> <p> 123 ."); // No abbreviations.
}
@Test(expected = ExFatal.class)
public void tuple_bad_7() {
parseCount("<x> <p> x:y ."); // No prefixed names
}
// Bad terms - but accepted by default.
@Test(expected = ExError.class)
public void tuple_bad_10() {
parseCount("<x> <p> <bad uri> .");
}
// Bad terms (value range) - but legal syntax
@Test
public void tuple_bad_11() {
parseCount("<x> <p> \"9000\"^^<http://www.w3.org/2001/XMLSchema#byte> .");
}
// Bad - relative URI.
@Test(expected = ExError.class)
public void tuple_bad_21() {
parseCheck("<x> <p> <z> .");
}
// Bad terms
@Test(expected = ExFatal.class)
public void tuple_bad_22() {
parseCheck("<http://example/x> <http://example/p> \"abc\"^^<http://example/bad uri> .");
}
@Test(expected = ExWarning.class)
public void tuple_bad_23() {
parseCheck("<http://example/x> <http://example/p> \"9000\"^^<http://www.w3.org/2001/XMLSchema#byte> .");
}
// ASCII vs UTF-8
@Test
public void tuple_charset_1() {
// E9 is e-acute
parseCheck("<http://example/x\\u00E9> <http://example/p> <http://example/s> .");
}
@Test
public void tuple_charset_2() {
parseCheck("<http://example/é> <http://example/p> \"é\" .");
}
static protected Tokenizer tokenizer(CharSpace charSpace, String string) {
byte b[] = StrUtils.asUTF8bytes(string);
ByteArrayInputStream in = new ByteArrayInputStream(b);
Tokenizer tokenizer = charSpace == CharSpace.ASCII
? TokenizerText.create().asciiOnly(true).source(in).build()
: TokenizerText.create().source(in).build();
return tokenizer;
}
static protected Tokenizer tokenizer(String string) {
// UTF-8
byte b[] = StrUtils.asUTF8bytes(string);
ByteArrayInputStream in = new ByteArrayInputStream(b);
Tokenizer tokenizer = TokenizerText.create().source(in).build() ;
return tokenizer;
}
final protected void parseCheck(String... strings) {
String string = String.join("\n", strings);
Tokenizer tokenizer = tokenizer(string);
StreamRDFCounting sink = StreamRDFLib.count();
LangRIOT x = RiotParsers.createParserNQuads(tokenizer, sink, parserProfile(new ErrorHandlerEx()));
x.parse();
}
final protected long parseCount(CharSpace charSpace, String... strings) {
String string = String.join("\n", strings);
Tokenizer tokenizer = tokenizer(charSpace, string);
StreamRDFCounting sink = StreamRDFLib.count();
LangRIOT x = RiotParsers.createParserNTriples(tokenizer, sink, parserProfile(new ErrorHandlerEx()));
x.parse();
return sink.count();
}
/** Create a {@link ParserProfile}, no resolving, no prefix map. */
static ParserProfile parserProfile(ErrorHandler errorHandler) {
return new ParserProfileStd(RiotLib.factoryRDF(),
errorHandler,
IRIs.absoluteResolver(),
PrefixMapFactory.emptyPrefixMap(),
RIOT.getContext().copy(),
true, false) ;
}
protected abstract Lang getLang();
protected long parseCount(String... strings) {
return ParserTestBaseLib.parseCount(getLang(), strings);
}
}