| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| package org.apache.rya.indexing.pcj.fluo.integration; |
| |
| import static org.junit.Assert.assertEquals; |
| import static org.junit.Assert.assertFalse; |
| |
| import java.util.HashSet; |
| import java.util.Set; |
| |
| import org.apache.accumulo.core.client.Connector; |
| import org.apache.fluo.api.client.FluoClient; |
| import org.apache.fluo.api.client.FluoFactory; |
| import org.apache.rya.api.domain.RyaStatement; |
| import org.apache.rya.api.domain.RyaURI; |
| import org.apache.rya.api.utils.CloseableIterator; |
| import org.apache.rya.indexing.pcj.fluo.api.CreateFluoPcj; |
| import org.apache.rya.indexing.pcj.fluo.api.InsertTriples; |
| import org.apache.rya.indexing.pcj.storage.PrecomputedJoinStorage; |
| import org.apache.rya.indexing.pcj.storage.accumulo.AccumuloPcjStorage; |
| import org.apache.rya.pcj.fluo.test.base.RyaExportITBase; |
| import org.junit.Test; |
| import org.openrdf.model.Statement; |
| import org.openrdf.model.ValueFactory; |
| import org.openrdf.model.impl.ValueFactoryImpl; |
| import org.openrdf.query.BindingSet; |
| import org.openrdf.query.impl.MapBindingSet; |
| import org.openrdf.repository.sail.SailRepositoryConnection; |
| |
| import com.google.common.base.Optional; |
| import com.google.common.collect.Sets; |
| |
| /** |
| * Performs integration tests over the Fluo application geared towards various types of input. |
| */ |
| public class InputIT extends RyaExportITBase { |
| |
| /** |
| * Ensure historic matches are included in the result. |
| */ |
| @Test |
| public void historicResults() throws Exception { |
| // A query that finds people who talk to Eve and work at Chipotle. |
| final String sparql = |
| "SELECT ?x WHERE { " + |
| "?x <http://talksTo> <http://Eve>. " + |
| "?x <http://worksAt> <http://Chipotle>." + |
| "}"; |
| |
| // Triples that are loaded into Rya before the PCJ is created. |
| final ValueFactory vf = new ValueFactoryImpl(); |
| final Set<Statement> historicTriples = Sets.newHashSet( |
| vf.createStatement(vf.createURI("http://Alice"), vf.createURI("http://talksTo"), vf.createURI("http://Eve")), |
| vf.createStatement(vf.createURI("http://Bob"), vf.createURI("http://talksTo"), vf.createURI("http://Eve")), |
| vf.createStatement(vf.createURI("http://Charlie"), vf.createURI("http://talksTo"), vf.createURI("http://Eve")), |
| |
| vf.createStatement(vf.createURI("http://Eve"), vf.createURI("http://helps"), vf.createURI("http://Kevin")), |
| |
| vf.createStatement(vf.createURI("http://Bob"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle")), |
| vf.createStatement(vf.createURI("http://Charlie"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle")), |
| vf.createStatement(vf.createURI("http://Eve"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle")), |
| vf.createStatement(vf.createURI("http://David"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle"))); |
| |
| // The expected results of the SPARQL query once the PCJ has been computed. |
| final Set<BindingSet> expected = new HashSet<>(); |
| |
| MapBindingSet bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Bob")); |
| expected.add(bs); |
| |
| bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Charlie")); |
| expected.add(bs); |
| |
| // Load the historic data into Rya. |
| final SailRepositoryConnection ryaConn = super.getRyaSailRepository().getConnection(); |
| for(final Statement triple : historicTriples) { |
| ryaConn.add(triple); |
| } |
| ryaConn.close(); |
| |
| // Create the PCJ table. |
| final Connector accumuloConn = super.getAccumuloConnector(); |
| final PrecomputedJoinStorage pcjStorage = new AccumuloPcjStorage(accumuloConn, getRyaInstanceName()); |
| final String pcjId = pcjStorage.createPcj(sparql); |
| |
| try(FluoClient fluoClient = FluoFactory.newClient(super.getFluoConfiguration())) { |
| // Tell the Fluo app to maintain the PCJ. |
| new CreateFluoPcj().withRyaIntegration(pcjId, pcjStorage, fluoClient, accumuloConn, getRyaInstanceName()); |
| |
| // Verify the end results of the query match the expected results. |
| super.getMiniFluo().waitForObservers(); |
| |
| final Set<BindingSet> results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add( resultsIt.next() ); |
| } |
| } |
| |
| assertEquals(expected, results); |
| } |
| } |
| |
| /** |
| * Ensure streamed matches are included in the result. |
| */ |
| @Test |
| public void streamedResults() throws Exception { |
| // A query that finds people who talk to Eve and work at Chipotle. |
| final String sparql = |
| "SELECT ?x WHERE { " + |
| "?x <http://talksTo> <http://Eve>. " + |
| "?x <http://worksAt> <http://Chipotle>." + |
| "}"; |
| |
| // Triples that will be streamed into Fluo after the PCJ has been created. |
| final Set<RyaStatement> streamedTriples = Sets.newHashSet( |
| new RyaStatement(new RyaURI("http://Alice"), new RyaURI("http://talksTo"), new RyaURI("http://Eve")), |
| new RyaStatement(new RyaURI("http://Bob"), new RyaURI("http://talksTo"), new RyaURI("http://Eve")), |
| new RyaStatement(new RyaURI("http://Charlie"), new RyaURI("http://talksTo"), new RyaURI("http://Eve")), |
| |
| new RyaStatement(new RyaURI("http://Eve"), new RyaURI("http://helps"), new RyaURI("http://Kevin")), |
| |
| new RyaStatement(new RyaURI("http://Bob"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle")), |
| new RyaStatement(new RyaURI("http://Charlie"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle")), |
| new RyaStatement(new RyaURI("http://Eve"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle")), |
| new RyaStatement(new RyaURI("http://David"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle"))); |
| |
| // The expected results of the SPARQL query once the PCJ has been computed. |
| final ValueFactory vf = new ValueFactoryImpl(); |
| final Set<BindingSet> expected = new HashSet<>(); |
| |
| MapBindingSet bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Bob")); |
| expected.add(bs); |
| |
| bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Charlie")); |
| expected.add(bs); |
| |
| // Create the PCJ table. |
| final Connector accumuloConn = super.getAccumuloConnector(); |
| final PrecomputedJoinStorage pcjStorage = new AccumuloPcjStorage(accumuloConn, getRyaInstanceName()); |
| final String pcjId = pcjStorage.createPcj(sparql); |
| |
| try(FluoClient fluoClient = FluoFactory.newClient(super.getFluoConfiguration())) { |
| // Tell the Fluo app to maintain the PCJ. |
| new CreateFluoPcj().withRyaIntegration(pcjId, pcjStorage, fluoClient, accumuloConn, getRyaInstanceName()); |
| |
| // Ensure the query has no results yet. |
| super.getMiniFluo().waitForObservers(); |
| |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| assertFalse( resultsIt.hasNext() ); |
| } |
| |
| // Stream the data into Fluo. |
| new InsertTriples().insert(fluoClient, streamedTriples, Optional.<String>absent()); |
| |
| // Verify the end results of the query match the expected results. |
| super.getMiniFluo().waitForObservers(); |
| |
| final HashSet<BindingSet> results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add( resultsIt.next() ); |
| } |
| } |
| |
| assertEquals(expected, results); |
| } |
| } |
| |
| /** |
| * Simulates the case where a Triple is added to Rya, a new query that includes |
| * that triple as a historic match is inserted into Fluo, and then some new |
| * triple that matches the query is streamed into Fluo. The query's results |
| * must include both the historic result and the newly streamed result. |
| */ |
| @Test |
| public void historicThenStreamedResults() throws Exception { |
| // A query that finds people who talk to Eve and work at Chipotle. |
| final String sparql = |
| "SELECT ?x WHERE { " + |
| "?x <http://talksTo> <http://Eve>. " + |
| "?x <http://worksAt> <http://Chipotle>." + |
| "}"; |
| |
| // Triples that are loaded into Rya before the PCJ is created. |
| final ValueFactory vf = new ValueFactoryImpl(); |
| final Set<Statement> historicTriples = Sets.newHashSet( |
| vf.createStatement(vf.createURI("http://Alice"), vf.createURI("http://talksTo"), vf.createURI("http://Eve")), |
| vf.createStatement(vf.createURI("http://Alice"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle"))); |
| |
| // Triples that will be streamed into Fluo after the PCJ has been created. |
| final Set<RyaStatement> streamedTriples = Sets.newHashSet( |
| new RyaStatement(new RyaURI("http://Frank"), new RyaURI("http://talksTo"), new RyaURI("http://Eve")), |
| new RyaStatement(new RyaURI("http://Frank"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle"))); |
| |
| // Load the historic data into Rya. |
| final SailRepositoryConnection ryaConn = super.getRyaSailRepository().getConnection(); |
| for(final Statement triple : historicTriples) { |
| ryaConn.add(triple); |
| } |
| ryaConn.close(); |
| |
| // Create the PCJ table. |
| final Connector accumuloConn = super.getAccumuloConnector(); |
| final PrecomputedJoinStorage pcjStorage = new AccumuloPcjStorage(accumuloConn, getRyaInstanceName()); |
| final String pcjId = pcjStorage.createPcj(sparql); |
| |
| try(FluoClient fluoClient = FluoFactory.newClient(super.getFluoConfiguration())) { |
| // Tell the Fluo app to maintain the PCJ. |
| new CreateFluoPcj().withRyaIntegration(pcjId, pcjStorage, fluoClient, accumuloConn, getRyaInstanceName()); |
| |
| // Ensure Alice is a match. |
| super.getMiniFluo().waitForObservers(); |
| |
| final Set<BindingSet> expected = new HashSet<>(); |
| |
| MapBindingSet bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Alice")); |
| expected.add(bs); |
| |
| Set<BindingSet> results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add(resultsIt.next()); |
| } |
| } |
| |
| assertEquals(expected, results); |
| |
| // Stream the data into Fluo. |
| new InsertTriples().insert(fluoClient, streamedTriples, Optional.<String>absent()); |
| |
| // Verify the end results of the query also include Frank. |
| super.getMiniFluo().waitForObservers(); |
| |
| bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Frank")); |
| expected.add(bs); |
| |
| results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add(resultsIt.next()); |
| } |
| } |
| |
| assertEquals(expected, results); |
| } |
| } |
| |
| /** |
| * Simulates the case where a Triple is added to Rya, a new query that |
| * includes the triple as a historic match is inserted into Fluo, and then |
| * the same triple is streamed into Fluo. The query's results will already |
| * include the Triple because they were added while the query was being |
| * created. This case should not fail or effect the end results in any way. |
| */ |
| @Test |
| public void historicAndStreamConflict() throws Exception { |
| // A query that finds people who talk to Eve and work at Chipotle. |
| final String sparql = |
| "SELECT ?x WHERE { " + |
| "?x <http://talksTo> <http://Eve>. " + |
| "?x <http://worksAt> <http://Chipotle>." + |
| "}"; |
| |
| // Triples that are loaded into Rya before the PCJ is created. |
| final ValueFactory vf = new ValueFactoryImpl(); |
| final Set<Statement> historicTriples = Sets.newHashSet( |
| vf.createStatement(vf.createURI("http://Alice"), vf.createURI("http://talksTo"), vf.createURI("http://Eve")), |
| vf.createStatement(vf.createURI("http://Alice"), vf.createURI("http://worksAt"), vf.createURI("http://Chipotle"))); |
| |
| // Triples that will be streamed into Fluo after the PCJ has been created. |
| final Set<RyaStatement> streamedTriples = Sets.newHashSet( |
| new RyaStatement(new RyaURI("http://Alice"), new RyaURI("http://talksTo"), new RyaURI("http://Eve")), |
| new RyaStatement(new RyaURI("http://Alice"), new RyaURI("http://worksAt"), new RyaURI("http://Chipotle"))); |
| |
| // The expected final result. |
| final Set<BindingSet> expected = new HashSet<>(); |
| |
| final MapBindingSet bs = new MapBindingSet(); |
| bs.addBinding("x", vf.createURI("http://Alice")); |
| expected.add(bs); |
| |
| // Load the historic data into Rya. |
| final SailRepositoryConnection ryaConn = super.getRyaSailRepository().getConnection(); |
| for(final Statement triple : historicTriples) { |
| ryaConn.add(triple); |
| } |
| ryaConn.close(); |
| |
| // Create the PCJ table. |
| final Connector accumuloConn = super.getAccumuloConnector(); |
| final PrecomputedJoinStorage pcjStorage = new AccumuloPcjStorage(accumuloConn, getRyaInstanceName()); |
| final String pcjId = pcjStorage.createPcj(sparql); |
| |
| try(FluoClient fluoClient = FluoFactory.newClient(super.getFluoConfiguration())) { |
| // Tell the Fluo app to maintain the PCJ. |
| new CreateFluoPcj().withRyaIntegration(pcjId, pcjStorage, fluoClient, accumuloConn, getRyaInstanceName()); |
| |
| // Ensure Alice is a match. |
| super.getMiniFluo().waitForObservers(); |
| |
| Set<BindingSet> results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add( resultsIt.next() ); |
| } |
| } |
| assertEquals(expected, results); |
| |
| // Stream the same Alice triple into Fluo. |
| new InsertTriples().insert(fluoClient, streamedTriples, Optional.<String>absent()); |
| |
| // Verify the end results of the query is stiill only Alice. |
| super.getMiniFluo().waitForObservers(); |
| |
| results = new HashSet<>(); |
| try(CloseableIterator<BindingSet> resultsIt = pcjStorage.listResults(pcjId)) { |
| while(resultsIt.hasNext()) { |
| results.add( resultsIt.next() ); |
| } |
| } |
| assertEquals(expected, results); |
| } |
| } |
| } |