blob: 8c08d68642a50b98a8c4145af262aeb392b3ad88 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package examples;
import org.apache.jena.atlas.lib.StrUtils ;
import org.apache.jena.atlas.logging.LogCtl ;
import org.apache.jena.query.* ;
import org.apache.jena.query.text.EntityDefinition ;
import org.apache.jena.query.text.TextDatasetFactory ;
import org.apache.jena.query.text.TextIndexConfig;
import org.apache.jena.rdf.model.Model ;
import org.apache.jena.riot.RDFDataMgr ;
import org.apache.jena.sparql.util.QueryExecUtils ;
import org.apache.jena.vocabulary.RDFS ;
import org.apache.lucene.store.ByteBuffersDirectory;
import org.apache.lucene.store.Directory ;
import org.slf4j.Logger ;
import org.slf4j.LoggerFactory ;
/** Build a text search dataset */
public class JenaTextExample1
{
static { LogCtl.setLogging(); }
static Logger log = LoggerFactory.getLogger("JenaTextExample") ;
public static void main(String ... argv)
{
Dataset ds = createCode() ;
//Dataset ds = createAssembler() ;
loadData(ds , "data.ttl") ;
queryData(ds) ;
}
public static Dataset createCode()
{
log.info("Construct an in-memory dataset with in-memory lucene index using code") ;
// Build a text dataset by code.
// Here , in-memory base data and in-memeory Lucene index
// Base data
Dataset ds1 = DatasetFactory.create() ;
// Define the index mapping
EntityDefinition entDef = new EntityDefinition("uri", "text");
entDef.setPrimaryPredicate(RDFS.label.asNode());
// Lucene, in memory.
Directory dir = new ByteBuffersDirectory();
// Join together into a dataset
Dataset ds = TextDatasetFactory.createLucene(ds1, dir, new TextIndexConfig(entDef)) ;
return ds ;
}
public static Dataset createAssembler()
{
log.info("Construct text dataset using an assembler description") ;
// There are two datasets in the configuration:
// the one for the base data and one with text index.
// Therefore we need to name the dataset we are interested in.
Dataset ds = DatasetFactory.assemble("text-config.ttl", "http://localhost/jena_example/#text_dataset") ;
return ds ;
}
public static void loadData(Dataset dataset, String file)
{
log.info("Start loading") ;
long startTime = System.nanoTime() ;
dataset.begin(ReadWrite.WRITE) ;
try {
Model m = dataset.getDefaultModel() ;
RDFDataMgr.read(m, file) ;
dataset.commit() ;
} finally { dataset.end() ; }
long finishTime = System.nanoTime() ;
double time = (finishTime-startTime)/1.0e6 ;
log.info(String.format("Finish loading - %.2fms", time)) ;
}
public static void queryData(Dataset dataset)
{
log.info("START") ;
long startTime = System.nanoTime() ;
String pre = StrUtils.strjoinNL
( "PREFIX : <http://example/>"
, "PREFIX text: <http://jena.apache.org/text#>"
, "PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>") ;
String qs = StrUtils.strjoinNL
( "SELECT * "
, " { ?s text:query (rdfs:label 'X1') ;"
, " rdfs:label ?label"
, " }") ;
dataset.begin(ReadWrite.READ) ;
try {
Query q = QueryFactory.create(pre+"\n"+qs) ;
QueryExecution qexec = QueryExecutionFactory.create(q , dataset) ;
QueryExecUtils.executeQuery(q, qexec) ;
} finally { dataset.end() ; }
long finishTime = System.nanoTime() ;
double time = (finishTime-startTime)/1.0e6 ;
log.info(String.format("FINISH - %.2fms", time)) ;
}
}