// blob: f6c43b2e82e3054506b8c30e1930875618a1b59e [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.streaming.runtime.operators.sink;
import org.apache.flink.annotation.Internal;
import org.apache.flink.api.common.state.ListState;
import org.apache.flink.api.common.state.ListStateDescriptor;
import org.apache.flink.api.common.typeutils.base.array.BytePrimitiveArraySerializer;
import org.apache.flink.api.connector.sink2.Sink.InitContext;
import org.apache.flink.api.connector.sink2.SinkWriter;
import org.apache.flink.api.connector.sink2.StatefulSink;
import org.apache.flink.api.connector.sink2.StatefulSink.StatefulSinkWriter;
import org.apache.flink.api.connector.sink2.StatefulSink.WithCompatibleState;
import org.apache.flink.core.io.SimpleVersionedSerializer;
import org.apache.flink.runtime.state.StateInitializationContext;
import org.apache.flink.streaming.api.operators.util.SimpleVersionedListState;
import org.apache.flink.util.CollectionUtil;
import org.apache.flink.shaded.guava30.com.google.common.collect.Iterables;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
/**
 * {@link SinkWriterStateHandler} for stateful sinks.
 *
 * <p>Creates the sink's writer (fresh, or restored from operator list state) and stores the
 * writer's snapshot back into operator list state on every {@link #snapshotState(long)} call.
 */
@Internal
final class StatefulSinkWriterStateHandler<InputT, WriterStateT>
        implements SinkWriterStateHandler<InputT> {

    /** Descriptor of the raw {@code byte[]} list state that backs this operator's writer state. */
    private static final ListStateDescriptor<byte[]> WRITER_RAW_STATES_DESC =
            new ListStateDescriptor<>("writer_raw_states", BytePrimitiveArraySerializer.INSTANCE);

    /** Serializer for writer state, obtained from the sink in the constructor. */
    private final SimpleVersionedSerializer<WriterStateT> writerStateSimpleVersionedSerializer;

    /**
     * State names of previous (compatible) sink operators whose state may be restored by this
     * handler. Restoring from a different sink implementation such as {@link
     * org.apache.flink.streaming.api.functions.sink.filesystem.StreamingFileSink} allows
     * migration to newer Sink implementations. Empty when the sink is not a {@link
     * WithCompatibleState}.
     */
    private final Collection<String> previousSinkStateNames;

    /** The sink used to create or restore the writer. */
    private final StatefulSink<InputT, WriterStateT> sink;

    // ------------------------------- runtime fields ---------------------------------------

    /**
     * List states opened under the names in {@link #previousSinkStateNames}. Filled while
     * restoring in {@link #createWriter} and cleared on every {@link #snapshotState(long)}.
     */
    private List<ListState<WriterStateT>> previousSinkStates = new ArrayList<>();

    /** This operator's own writer state; assigned in {@link #createWriter}. */
    private ListState<WriterStateT> writerState;

    /** The writer produced by {@link #createWriter}; its snapshots are stored as state. */
    private StatefulSinkWriter<InputT, WriterStateT> sinkWriter;

    /**
     * Creates a handler for the given sink.
     *
     * @param sink the stateful sink; if it also implements {@link WithCompatibleState}, its
     *     compatible writer state names are remembered for restore
     */
    public StatefulSinkWriterStateHandler(StatefulSink<InputT, WriterStateT> sink) {
        this.sink = sink;
        if (sink instanceof StatefulSink.WithCompatibleState) {
            this.previousSinkStateNames =
                    ((WithCompatibleState) sink).getCompatibleWriterStateNames();
        } else {
            this.previousSinkStateNames = Collections.emptyList();
        }
        this.writerStateSimpleVersionedSerializer = sink.getWriterStateSerializer();
    }

    /**
     * Creates the sink writer, restoring it from state when the context reports a restore.
     *
     * <p>On restore, the states handed to the sink are this operator's own writer states
     * followed by the contents of every compatible previous sink state, in the iteration order
     * of {@link #previousSinkStateNames}.
     *
     * @param initContext the context passed through to the sink when creating the writer
     * @param context the state initialization context providing the operator state store
     * @return the newly created or restored writer
     * @throws Exception if accessing state or creating the writer fails
     */
    @Override
    public SinkWriter<InputT> createWriter(
            InitContext initContext, StateInitializationContext context) throws Exception {
        writerState =
                new SimpleVersionedListState<>(
                        context.getOperatorStateStore().getListState(WRITER_RAW_STATES_DESC),
                        writerStateSimpleVersionedSerializer);

        // Nothing to restore: start with a fresh writer.
        if (!context.isRestored()) {
            sinkWriter = sink.createWriter(initContext);
            return sinkWriter;
        }

        // Copy into a fresh ArrayList so that compatible states can be appended below.
        final List<WriterStateT> recoveredStates =
                new ArrayList<>(CollectionUtil.iterableToList(writerState.get()));
        for (String compatibleStateName : previousSinkStateNames) {
            final ListState<WriterStateT> compatibleState =
                    openCompatibleState(context, compatibleStateName);
            previousSinkStates.add(compatibleState);
            Iterables.addAll(recoveredStates, compatibleState.get());
        }

        sinkWriter = sink.restoreWriter(initContext, recoveredStates);
        return sinkWriter;
    }

    /**
     * Stores the writer's snapshot for the given checkpoint as this operator's state and clears
     * all previous sink states.
     *
     * @param checkpointId the id of the checkpoint being taken
     * @throws Exception if snapshotting the writer or updating the state fails
     */
    @Override
    public void snapshotState(long checkpointId) throws Exception {
        final List<WriterStateT> currentWriterState = sinkWriter.snapshotState(checkpointId);
        writerState.update(currentWriterState);
        // NOTE(review): presumably the previous sinks' state is dropped because it was already
        // handed to the restored writer in createWriter -- confirm.
        for (ListState<WriterStateT> compatibleState : previousSinkStates) {
            compatibleState.clear();
        }
    }

    /**
     * Opens the raw list state registered under {@code stateName} and wraps it with the writer
     * state serializer.
     */
    private ListState<WriterStateT> openCompatibleState(
            StateInitializationContext context, String stateName) throws Exception {
        final ListStateDescriptor<byte[]> rawDescriptor =
                new ListStateDescriptor<>(stateName, BytePrimitiveArraySerializer.INSTANCE);
        final ListState<byte[]> rawCompatibleState =
                context.getOperatorStateStore().getListState(rawDescriptor);
        return new SimpleVersionedListState<>(
                rawCompatibleState, writerStateSimpleVersionedSerializer);
    }
}