| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.flink.streaming.tests; |
| |
| import org.apache.flink.api.common.functions.FlatMapFunction; |
| import org.apache.flink.api.common.functions.RuntimeContext; |
| import org.apache.flink.api.java.tuple.Tuple2; |
| import org.apache.flink.api.java.utils.ParameterTool; |
| import org.apache.flink.streaming.api.datastream.DataStream; |
| import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; |
| import org.apache.flink.streaming.connectors.elasticsearch.RequestIndexer; |
| import org.apache.flink.streaming.connectors.elasticsearch5.ElasticsearchSink; |
| import org.apache.flink.util.Collector; |
| |
| import org.elasticsearch.action.index.IndexRequest; |
| import org.elasticsearch.action.update.UpdateRequest; |
| import org.elasticsearch.client.Requests; |
| |
| import java.net.InetAddress; |
| import java.net.InetSocketAddress; |
| import java.util.ArrayList; |
| import java.util.HashMap; |
| import java.util.List; |
| import java.util.Map; |
| |
| /** End to end test for Elasticsearch5Sink. */ |
| public class Elasticsearch5SinkExample { |
| |
| public static void main(String[] args) throws Exception { |
| |
| final ParameterTool parameterTool = ParameterTool.fromArgs(args); |
| |
| if (parameterTool.getNumberOfParameters() < 3) { |
| System.out.println( |
| "Missing parameters!\n" |
| + "Usage: --numRecords <numRecords> --index <index> --type <type>"); |
| return; |
| } |
| |
| final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); |
| env.enableCheckpointing(5000); |
| |
| DataStream<Tuple2<String, String>> source = |
| env.generateSequence(0, parameterTool.getInt("numRecords") - 1) |
| .flatMap( |
| new FlatMapFunction<Long, Tuple2<String, String>>() { |
| @Override |
| public void flatMap( |
| Long value, Collector<Tuple2<String, String>> out) { |
| final String key = String.valueOf(value); |
| final String message = "message #" + value; |
| out.collect(Tuple2.of(key, message + "update #1")); |
| out.collect(Tuple2.of(key, message + "update #2")); |
| } |
| }); |
| |
| Map<String, String> userConfig = new HashMap<>(); |
| userConfig.put("cluster.name", "elasticsearch"); |
| // This instructs the sink to emit after every element, otherwise they would be buffered |
| userConfig.put(ElasticsearchSink.CONFIG_KEY_BULK_FLUSH_MAX_ACTIONS, "1"); |
| |
| List<InetSocketAddress> transports = new ArrayList<>(); |
| transports.add(new InetSocketAddress(InetAddress.getByName("127.0.0.1"), 9300)); |
| |
| source.addSink( |
| new ElasticsearchSink<>( |
| userConfig, |
| transports, |
| (Tuple2<String, String> element, |
| RuntimeContext ctx, |
| RequestIndexer indexer) -> { |
| indexer.add(createIndexRequest(element.f1, parameterTool)); |
| indexer.add(createUpdateRequest(element, parameterTool)); |
| })); |
| |
| env.execute("Elasticsearch5.x end to end sink test example"); |
| } |
| |
| private static IndexRequest createIndexRequest(String element, ParameterTool parameterTool) { |
| Map<String, Object> json = new HashMap<>(); |
| json.put("data", element); |
| |
| return Requests.indexRequest() |
| .index(parameterTool.getRequired("index")) |
| .type(parameterTool.getRequired("type")) |
| .id(element) |
| .source(json); |
| } |
| |
| private static UpdateRequest createUpdateRequest( |
| Tuple2<String, String> element, ParameterTool parameterTool) { |
| Map<String, Object> json = new HashMap<>(); |
| json.put("data", element.f1); |
| |
| return new UpdateRequest( |
| parameterTool.getRequired("index"), |
| parameterTool.getRequired("type"), |
| element.f0) |
| .doc(json) |
| .upsert(json); |
| } |
| } |