// blob: 95a7684c89434f3fbd505070e2d0c97ca10dd053
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.streams.example.elasticsearch.test;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.fasterxml.jackson.databind.node.ObjectNode;
import com.google.common.collect.Lists;
import org.apache.commons.io.Charsets;
import org.apache.commons.io.IOUtils;
import org.apache.streams.core.StreamsDatum;
import org.apache.streams.elasticsearch.ElasticsearchConfiguration;
import org.apache.streams.elasticsearch.ElasticsearchPersistWriter;
import org.apache.streams.elasticsearch.ElasticsearchWriterConfiguration;
import org.apache.streams.elasticsearch.example.ElasticsearchReindex;
import org.apache.streams.elasticsearch.example.ElasticsearchReindexConfiguration;
import org.apache.streams.jackson.StreamsJacksonMapper;
import org.apache.streams.pojo.json.Activity;
import org.apache.streams.pojo.json.ActivityObject;
import org.elasticsearch.action.admin.indices.template.put.PutIndexTemplateRequestBuilder;
import org.elasticsearch.test.ElasticsearchIntegrationTest;
import org.junit.Before;
import org.junit.Test;
import org.reflections.Reflections;
import org.reflections.scanners.SubTypesScanner;
import org.reflections.util.ClasspathHelper;
import org.reflections.util.ConfigurationBuilder;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.io.InputStream;
import java.net.URL;
import java.util.List;
import java.util.Set;
/**
 * Integration test that copies parent/child associated documents between two
 * indexes ("source" and "destination") on the same cluster.
 *
 * <p>{@link #prepareTest()} registers the index template read from
 * {@code /ActivityChildObjectParent.json} and fills the "source" index with one
 * "object" document per {@link ActivityObject} subtype plus one "activity"
 * document per file listed under the {@code activities} classpath folder; each
 * activity datum names its object's type as its "parent".
 *
 * <p>{@link #testReindex()} then runs two reindex passes, configured by
 * {@code /testReindexParent.json} and {@code /testReindexChild.json}, and checks
 * that "destination" ends up with as many documents as "source".
 */
@ElasticsearchIntegrationTest.ClusterScope(scope= ElasticsearchIntegrationTest.Scope.TEST, numNodes=1)
public class ElasticsearchReindexParentChildIT extends ElasticsearchIntegrationTest {

    private final static Logger LOGGER = LoggerFactory.getLogger(ElasticsearchReindexParentChildIT.class);

    ObjectMapper MAPPER = StreamsJacksonMapper.getInstance();

    ElasticsearchConfiguration testConfiguration = new ElasticsearchConfiguration();

    /**
     * Points the test configuration at the test cluster, installs the index
     * template and populates the "source" index with parent objects and child
     * activities.
     *
     * @throws Exception if a resource cannot be read or a document cannot be written
     */
    @Before
    public void prepareTest() throws Exception {

        testConfiguration = new ElasticsearchConfiguration();
        testConfiguration.setHosts(Lists.newArrayList("localhost"));
        testConfiguration.setClusterName(cluster().getClusterName());

        installIndexTemplate();

        ElasticsearchWriterConfiguration setupWriterConfiguration =
                MAPPER.convertValue(testConfiguration, ElasticsearchWriterConfiguration.class);
        setupWriterConfiguration.setIndex("source");
        setupWriterConfiguration.setBatchSize(5L);

        ElasticsearchPersistWriter setupWriter = new ElasticsearchPersistWriter(setupWriterConfiguration);
        setupWriter.prepare(null);
        try {
            writeParentObjects(setupWriter);
            writeChildActivities(setupWriter);
        } finally {
            // Always call cleanUp(), even when one of the writes above fails.
            setupWriter.cleanUp();
        }

        flushAndRefresh();
    }

    /**
     * Runs the parent reindex followed by the child reindex and verifies that the
     * "destination" index holds the same number of documents as "source".
     *
     * <p>Checks throw {@link AssertionError} directly rather than using the
     * {@code assert} keyword, so they are evaluated even when the JVM runs
     * without {@code -ea}.
     *
     * @throws Exception if a configuration cannot be read or a reindex thread is interrupted
     */
    @Test
    public void testReindex() throws Exception {

        failUnless(indexExists("source"), "index 'source' does not exist");
        long srcCount = countDocuments("source");
        failUnless(srcCount > 0, "index 'source' is empty");

        runReindex("/testReindexParent.json");
        runReindex("/testReindexChild.json");

        failUnless(indexExists("destination"), "index 'destination' does not exist");
        long destCount = countDocuments("destination");
        failUnless(srcCount == destCount,
                "document count mismatch: source=" + srcCount + ", destination=" + destCount);
    }

    /** Registers the "mappings" index template read from /ActivityChildObjectParent.json. */
    private void installIndexTemplate() throws Exception {
        URL templateURL = ElasticsearchReindexParentChildIT.class.getResource("/ActivityChildObjectParent.json");
        if (templateURL == null) {
            throw new IllegalStateException("Test resource not found on classpath: /ActivityChildObjectParent.json");
        }
        // Round-trip through ObjectNode so the template is parsed as JSON before it is sent.
        ObjectNode template = MAPPER.readValue(templateURL, ObjectNode.class);
        String templateSource = MAPPER.writeValueAsString(template);

        PutIndexTemplateRequestBuilder putTemplateRequestBuilder =
                client().admin().indices().preparePutTemplate("mappings");
        putTemplateRequestBuilder.setSource(templateSource);
        client().admin().indices().putTemplate(putTemplateRequestBuilder.request()).actionGet();
    }

    /** Writes one "object" document for every ActivityObject subtype found in org.apache.streams.pojo.json. */
    private void writeParentObjects(ElasticsearchPersistWriter writer) throws Exception {
        Reflections reflections = new Reflections(new ConfigurationBuilder()
                .setUrls(ClasspathHelper.forPackage("org.apache.streams.pojo.json"))
                .setScanners(new SubTypesScanner()));
        Set<Class<? extends ActivityObject>> objectTypes = reflections.getSubTypesOf(ActivityObject.class);

        for (Class<? extends ActivityObject> objectType : objectTypes) {
            Object object = objectType.newInstance();
            ActivityObject activityObject = MAPPER.convertValue(object, ActivityObject.class);
            StreamsDatum datum = new StreamsDatum(activityObject, activityObject.getObjectType());
            datum.getMetadata().put("type", "object");
            writer.write(datum);
        }
    }

    /** Writes one "activity" document per file listed in the "activities" classpath folder. */
    private void writeChildActivities(ElasticsearchPersistWriter writer) throws Exception {
        ClassLoader classLoader = ElasticsearchReindexParentChildIT.class.getClassLoader();

        List<String> files;
        InputStream folderStream = requireFound(classLoader.getResourceAsStream("activities"), "activities");
        try {
            files = IOUtils.readLines(folderStream, Charsets.UTF_8);
        } finally {
            folderStream.close();
        }

        for (String file : files) {
            LOGGER.info("File: {}", file);
            String resourceName = "activities/" + file;
            Activity activity;
            InputStream fileStream = requireFound(classLoader.getResourceAsStream(resourceName), resourceName);
            try {
                activity = MAPPER.readValue(fileStream, Activity.class);
            } finally {
                fileStream.close();
            }
            StreamsDatum datum = new StreamsDatum(activity, activity.getVerb());
            // The activity's object type is recorded as the datum's "parent".
            datum.getMetadata().put("parent", activity.getObject().getObjectType());
            datum.getMetadata().put("type", "activity");
            writer.write(datum);
            LOGGER.info("Wrote: {}", activity.getVerb());
        }
    }

    /**
     * Loads a reindex configuration from the classpath, points both its source and
     * destination at the test cluster, runs the reindex on its own thread until it
     * finishes, then flushes and refreshes the indexes.
     */
    private void runReindex(String configurationResource) throws Exception {
        ElasticsearchReindexConfiguration reindexConfiguration;
        InputStream configurationStream = requireFound(
                ElasticsearchReindexParentChildIT.class.getResourceAsStream(configurationResource),
                configurationResource);
        try {
            reindexConfiguration = MAPPER.readValue(configurationStream, ElasticsearchReindexConfiguration.class);
        } finally {
            configurationStream.close();
        }
        reindexConfiguration.getDestination().setClusterName(cluster().getClusterName());
        reindexConfiguration.getSource().setClusterName(cluster().getClusterName());

        ElasticsearchReindex reindex = new ElasticsearchReindex(reindexConfiguration);
        Thread reindexThread = new Thread(reindex);
        reindexThread.start();
        reindexThread.join();

        flushAndRefresh();
    }

    /** Returns the number of documents the count API reports for the given index. */
    private long countDocuments(String index) throws Exception {
        return client().count(client().prepareCount(index).request()).get().getCount();
    }

    /** Returns the stream unchanged, or fails with a descriptive message when the resource was not found. */
    private static InputStream requireFound(InputStream stream, String resourceName) {
        if (stream == null) {
            throw new IllegalStateException("Test resource not found on classpath: " + resourceName);
        }
        return stream;
    }

    /** Fails the test with the given message when the condition is false, regardless of the -ea JVM flag. */
    private static void failUnless(boolean condition, String message) {
        if (!condition) {
            throw new AssertionError(message);
        }
    }
}