// blob: 5f849d6db1dd2f75323c2860b01841cd25f17ccb [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jena.query.text;
import java.io.File ;
import java.io.Reader ;
import java.io.StringReader ;
import java.util.Arrays ;
import java.util.HashSet ;
import java.util.Set ;
import org.apache.jena.assembler.Assembler ;
import org.apache.jena.atlas.lib.StrUtils ;
import org.apache.jena.query.Dataset ;
import org.apache.jena.query.text.assembler.TextAssembler ;
import org.apache.jena.rdf.model.Model ;
import org.apache.jena.rdf.model.ModelFactory ;
import org.apache.jena.rdf.model.Resource ;
import org.junit.After ;
import org.junit.Before ;
import org.junit.Test ;
/**
 * Tests a text dataset whose {@code rdfs:label} field is indexed in Lucene with
 * {@code text:SimpleAnalyzer}.
 *
 * <p>The dataset is built from an in-memory assembler specification ({@link #SPEC})
 * before every test and the on-disk index directory is removed after every test.
 */
public class TestDatasetWithSimpleAnalyzer extends AbstractTestDatasetWithTextIndexBase {
    /** Location of the Lucene index, relative to the working directory. */
    private static final String INDEX_PATH = "target/test/TestDatasetWithLuceneIndex";
    private static final File indexDir = new File(INDEX_PATH);

    private static final String SPEC_BASE = "http://example.org/spec#";
    private static final String SPEC_ROOT_LOCAL = "lucene_text_dataset";
    private static final String SPEC_ROOT_URI = SPEC_BASE + SPEC_ROOT_LOCAL;

    /** Turtle assembler description of the text dataset under test. */
    private static final String SPEC;
    static {
        SPEC = StrUtils.strjoinNL(
            "prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> ",
            "prefix ja: <http://jena.hpl.hp.com/2005/11/Assembler#> ",
            "prefix tdb: <http://jena.hpl.hp.com/2008/tdb#>",
            "prefix text: <http://jena.apache.org/text#>",
            "prefix : <" + SPEC_BASE + ">",
            "",
            "[] ja:loadClass \"org.apache.jena.query.text.TextQuery\" .",
            "text:TextDataset rdfs:subClassOf ja:RDFDataset .",
            "text:TextIndexLucene rdfs:subClassOf text:TextIndex .",
            ":" + SPEC_ROOT_LOCAL,
            " a text:TextDataset ;",
            " text:dataset :dataset ;",
            " text:index :indexLucene ;",
            " .",
            "",
            ":dataset",
            " a ja:RDFDataset ;",
            " ja:defaultGraph :graph ;",
            ".",
            ":graph",
            " a ja:MemoryModel ;",
            ".",
            "",
            ":indexLucene",
            " a text:TextIndexLucene ;",
            " text:directory <file:" + INDEX_PATH + "> ;",
            " text:entityMap :entMap ;",
            " .",
            "",
            ":entMap",
            " a text:EntityMap ;",
            " text:entityField \"uri\" ;",
            " text:defaultField \"label\" ;",
            " text:map (",
            " [ text:field \"label\" ; ",
            " text:predicate rdfs:label ;",
            " text:analyzer [ a text:SimpleAnalyzer ]",
            " ]",
            " [ text:field \"comment\" ; text:predicate rdfs:comment ]",
            " ) ."
        );
    }

    /**
     * Parses {@link #SPEC}, prepares an empty index directory and assembles the
     * dataset, storing it in the inherited {@code dataset} field.
     */
    public void init() {
        Reader reader = new StringReader(SPEC);
        Model specModel = ModelFactory.createDefaultModel();
        specModel.read(reader, "", "TURTLE");
        TextAssembler.init();
        // Remove any index left behind by an earlier run that did not reach its
        // clean-up. This deliberately does not go through deleteOldFiles(), which
        // also closes the dataset that has not been created yet.
        if (indexDir.exists()) {
            TextSearchUtil.emptyAndDeleteDirectory(indexDir);
        }
        indexDir.mkdirs();
        Resource root = specModel.getResource(SPEC_ROOT_URI);
        dataset = (Dataset) Assembler.general.open(root);
    }

    /**
     * Closes the dataset, if one was created, and deletes the index directory.
     *
     * <p>The directory is removed even when closing the dataset fails, so a
     * failing test does not leave an index on disk for the next one.
     */
    public void deleteOldFiles() {
        try {
            // dataset is still null when init() failed before assembling it;
            // guarding here keeps the original failure from being joined by an NPE.
            if (dataset != null) {
                dataset.close();
            }
        } finally {
            if (indexDir.exists()) {
                TextSearchUtil.emptyAndDeleteDirectory(indexDir);
            }
        }
    }

    /** Runs before each test method (JUnit {@code @Before}), despite its name. */
    @Before
    public void beforeClass() {
        init();
    }

    /** Runs after each test method (JUnit {@code @After}), despite its name. */
    @After
    public void afterClass() {
        deleteOldFiles();
    }

    /**
     * Loads one resource labelled {@code 'bar the barfoo foo'} and queries the
     * label field for {@code 'the'}, expecting that resource to be returned.
     */
    @Test
    public void testSimpleAnalyzer() {
        final String turtle = StrUtils.strjoinNL(
            TURTLE_PROLOG,
            "<" + RESOURCE_BASE + "testSimpleAnalyzer>",
            " rdfs:label 'bar the barfoo foo'",
            "."
        );
        // the simple analyzer should not filter out the 'the' word
        String queryString = StrUtils.strjoinNL(
            QUERY_PROLOG,
            "SELECT ?s",
            "WHERE {",
            " ?s text:query ( rdfs:label 'the' 10 ) .",
            "}"
        );
        // NOTE(review): presumably equal to RESOURCE_BASE + "testSimpleAnalyzer";
        // RESOURCE_BASE is declared outside this file, so the literal is kept as is.
        Set<String> expectedURIs = new HashSet<>(
            Arrays.asList("http://example.org/data/resource/testSimpleAnalyzer"));
        doTestSearch(turtle, queryString, expectedURIs);
    }
}