blob: 83bfa1dfa3364d6ad8abf4032fb4c60ddbe5b622 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.connector.opensearch.sink;
import org.apache.flink.annotation.PublicEvolving;
import org.apache.flink.annotation.VisibleForTesting;
import org.apache.flink.api.connector.sink2.Sink;
import org.apache.flink.api.connector.sink2.SinkWriter;
import org.apache.flink.api.connector.sink2.WriterInitContext;
import org.apache.flink.connector.base.DeliveryGuarantee;
import org.apache.flink.connector.opensearch.sink.BulkResponseInspector.BulkResponseInspectorFactory;
import org.apache.http.HttpHost;
import java.io.IOException;
import java.util.List;
import static org.apache.flink.util.Preconditions.checkArgument;
import static org.apache.flink.util.Preconditions.checkNotNull;
/**
* Flink Sink to insert or update data in an Opensearch index. The sink supports the following
* delivery guarantees.
*
* <ul>
* <li>{@link DeliveryGuarantee#NONE} does not provide any guarantees: actions are flushed to
* Opensearch only depending on the configurations of the bulk processor. In case of a
* failure, it might happen that actions are lost if the bulk processor still has buffered
* actions.
* <li>{@link DeliveryGuarantee#AT_LEAST_ONCE} on a checkpoint the sink will wait until all
* buffered actions are flushed to and acknowledged by Opensearch. No actions will be lost but
* actions might be sent to Opensearch multiple times when Flink restarts. These additional
* requests may cause inconsistent data in Opensearch right after the restart, but eventually
* everything will be consistent again.
* </ul>
*
* @param <IN> type of the records converted to Opensearch actions
* @see OpensearchSinkBuilder on how to construct a OpensearchSink
*/
@PublicEvolving
public class OpensearchSink<IN> implements Sink<IN> {
private final List<HttpHost> hosts;
private final OpensearchEmitter<? super IN> emitter;
private final BulkProcessorConfig buildBulkProcessorConfig;
private final NetworkClientConfig networkClientConfig;
private final DeliveryGuarantee deliveryGuarantee;
private final RestClientFactory restClientFactory;
private final BulkResponseInspectorFactory bulkResponseInspectorFactory;
OpensearchSink(
List<HttpHost> hosts,
OpensearchEmitter<? super IN> emitter,
DeliveryGuarantee deliveryGuarantee,
BulkProcessorConfig buildBulkProcessorConfig,
NetworkClientConfig networkClientConfig,
RestClientFactory restClientFactory,
BulkResponseInspectorFactory bulkResponseInspectorFactory) {
this.hosts = checkNotNull(hosts);
checkArgument(!hosts.isEmpty(), "Hosts cannot be empty.");
this.emitter = checkNotNull(emitter);
this.deliveryGuarantee = checkNotNull(deliveryGuarantee);
this.buildBulkProcessorConfig = checkNotNull(buildBulkProcessorConfig);
this.networkClientConfig = checkNotNull(networkClientConfig);
this.restClientFactory = checkNotNull(restClientFactory);
this.bulkResponseInspectorFactory = checkNotNull(bulkResponseInspectorFactory);
}
@Override
public SinkWriter<IN> createWriter(WriterInitContext context) throws IOException {
return new OpensearchWriter<>(
hosts,
emitter,
deliveryGuarantee == DeliveryGuarantee.AT_LEAST_ONCE,
buildBulkProcessorConfig,
networkClientConfig,
context.metricGroup(),
context.getMailboxExecutor(),
restClientFactory,
bulkResponseInspectorFactory.apply(context::metricGroup));
}
@VisibleForTesting
DeliveryGuarantee getDeliveryGuarantee() {
return deliveryGuarantee;
}
@VisibleForTesting
BulkResponseInspectorFactory getBulkResponseInspectorFactory() {
return bulkResponseInspectorFactory;
}
}