blob: 6a3477651f1a53431fe3b226371f33ead4b186b9 [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package org.apache.doris.flink.sink;
import org.apache.flink.api.connector.sink2.Committer;
import org.apache.flink.api.connector.sink2.StatefulSink;
import org.apache.flink.api.connector.sink2.TwoPhaseCommittingSink;
import org.apache.flink.core.io.SimpleVersionedSerializer;
import org.apache.flink.util.Preconditions;
import org.apache.doris.flink.cfg.DorisExecutionOptions;
import org.apache.doris.flink.cfg.DorisOptions;
import org.apache.doris.flink.cfg.DorisReadOptions;
import org.apache.doris.flink.rest.RestService;
import org.apache.doris.flink.sink.batch.DorisBatchWriter;
import org.apache.doris.flink.sink.committer.DorisCommitter;
import org.apache.doris.flink.sink.writer.DorisAbstractWriter;
import org.apache.doris.flink.sink.writer.DorisWriter;
import org.apache.doris.flink.sink.writer.DorisWriterState;
import org.apache.doris.flink.sink.writer.DorisWriterStateSerializer;
import org.apache.doris.flink.sink.writer.WriteMode;
import org.apache.doris.flink.sink.writer.serializer.DorisRecordSerializer;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.io.IOException;
import java.util.Collection;
import java.util.Collections;
/**
* Load data into Doris based on 2PC. see {@link DorisWriter} and {@link DorisCommitter}.
*
* @param <IN> type of record.
*/
public class DorisSink<IN>
implements StatefulSink<IN, DorisWriterState>,
TwoPhaseCommittingSink<IN, DorisCommittable> {
private static final Logger LOG = LoggerFactory.getLogger(DorisSink.class);
private final DorisOptions dorisOptions;
private final DorisReadOptions dorisReadOptions;
private final DorisExecutionOptions dorisExecutionOptions;
private final DorisRecordSerializer<IN> serializer;
public DorisSink(
DorisOptions dorisOptions,
DorisReadOptions dorisReadOptions,
DorisExecutionOptions dorisExecutionOptions,
DorisRecordSerializer<IN> serializer) {
this.dorisOptions = dorisOptions;
this.dorisReadOptions = dorisReadOptions;
this.dorisExecutionOptions = dorisExecutionOptions;
this.serializer = serializer;
checkKeyType();
}
/** The uniq model has 2pc close by default unless 2pc is forced open. */
private void checkKeyType() {
if (dorisExecutionOptions.enabled2PC()
&& !dorisExecutionOptions.force2PC()
&& RestService.isUniqueKeyType(dorisOptions, dorisReadOptions, LOG)) {
dorisExecutionOptions.setEnable2PC(false);
}
}
@Override
public DorisAbstractWriter createWriter(InitContext initContext) throws IOException {
return getDorisAbstractWriter(initContext, Collections.emptyList());
}
@Override
public Committer<DorisCommittable> createCommitter() throws IOException {
return new DorisCommitter(
dorisOptions, dorisReadOptions, dorisExecutionOptions.getMaxRetries());
}
@Override
public DorisAbstractWriter restoreWriter(
InitContext initContext, Collection<DorisWriterState> recoveredState)
throws IOException {
return getDorisAbstractWriter(initContext, recoveredState);
}
public DorisAbstractWriter getDorisAbstractWriter(
InitContext initContext, Collection<DorisWriterState> states) {
if (WriteMode.STREAM_LOAD.equals(dorisExecutionOptions.getWriteMode())) {
return new DorisWriter<>(
initContext,
states,
serializer,
dorisOptions,
dorisReadOptions,
dorisExecutionOptions);
} else if (WriteMode.STREAM_LOAD_BATCH.equals(dorisExecutionOptions.getWriteMode())) {
return new DorisBatchWriter<>(
initContext, serializer, dorisOptions, dorisReadOptions, dorisExecutionOptions);
}
throw new IllegalArgumentException(
"Unsupported write mode " + dorisExecutionOptions.getWriteMode());
}
@Override
public SimpleVersionedSerializer<DorisWriterState> getWriterStateSerializer() {
return new DorisWriterStateSerializer();
}
@Override
public SimpleVersionedSerializer<DorisCommittable> getCommittableSerializer() {
return new DorisCommittableSerializer();
}
public static <IN> Builder<IN> builder() {
return new Builder<>();
}
/**
* build for DorisSink.
*
* @param <IN> record type.
*/
public static class Builder<IN> {
private DorisOptions dorisOptions;
private DorisReadOptions dorisReadOptions;
private DorisExecutionOptions dorisExecutionOptions;
private DorisRecordSerializer<IN> serializer;
public Builder<IN> setDorisOptions(DorisOptions dorisOptions) {
this.dorisOptions = dorisOptions;
return this;
}
public Builder<IN> setDorisReadOptions(DorisReadOptions dorisReadOptions) {
this.dorisReadOptions = dorisReadOptions;
return this;
}
public Builder<IN> setDorisExecutionOptions(DorisExecutionOptions dorisExecutionOptions) {
this.dorisExecutionOptions = dorisExecutionOptions;
return this;
}
public Builder<IN> setSerializer(DorisRecordSerializer<IN> serializer) {
this.serializer = serializer;
return this;
}
public DorisSink<IN> build() {
Preconditions.checkNotNull(dorisOptions);
Preconditions.checkNotNull(dorisExecutionOptions);
Preconditions.checkNotNull(serializer);
if (dorisReadOptions == null) {
dorisReadOptions = DorisReadOptions.builder().build();
}
return new DorisSink<>(
dorisOptions, dorisReadOptions, dorisExecutionOptions, serializer);
}
}
}