| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.flink.streaming.tests; |
| |
| import org.apache.flink.api.common.state.StateTtlConfig; |
| import org.apache.flink.api.common.time.Time; |
| import org.apache.flink.api.java.utils.ParameterTool; |
| import org.apache.flink.configuration.ConfigOption; |
| import org.apache.flink.configuration.ConfigOptions; |
| import org.apache.flink.runtime.state.StateBackend; |
| import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; |
| import org.apache.flink.streaming.api.functions.sink.PrintSinkFunction; |
| |
| import static org.apache.flink.streaming.tests.DataStreamAllroundTestJobFactory.setupEnvironment; |
| |
| /** |
| * A test job for State TTL feature. |
| * |
| * <p>The test pipeline does the following: |
| * - generates random keyed state updates for each state TTL verifier (state type) |
| * - performs update of created state with TTL for each verifier |
| * - keeps previous updates in other state |
| * - verifies expected result of last update against preserved history of updates |
| * |
| * <p>Program parameters: |
| * <ul> |
| * <li>update_generator_source.keyspace (int, default - 100): Number of different keys for updates emitted by the update generator.</li> |
| * <li>update_generator_source.sleep_time (long, default - 0): Milliseconds to sleep after emitting updates in the update generator. Set to 0 to disable sleeping.</li> |
| * <li>update_generator_source.sleep_after_elements (long, default - 0): Number of updates to emit before sleeping in the update generator. Set to 0 to disable sleeping.</li> |
| * <li>state_ttl_verifier.ttl_milli (long, default - 1000): State time-to-live.</li> |
| * <li>report_stat.after_updates_num (long, default - 200): Report state update statistics after certain number of updates (average update chain length and clashes).</li> |
| * </ul> |
| */ |
| public class DataStreamStateTTLTestProgram { |
| private static final ConfigOption<Integer> UPDATE_GENERATOR_SRC_KEYSPACE = ConfigOptions |
| .key("update_generator_source.keyspace") |
| .defaultValue(100); |
| |
| private static final ConfigOption<Long> UPDATE_GENERATOR_SRC_SLEEP_TIME = ConfigOptions |
| .key("update_generator_source.sleep_time") |
| .defaultValue(0L); |
| |
| private static final ConfigOption<Long> UPDATE_GENERATOR_SRC_SLEEP_AFTER_ELEMENTS = ConfigOptions |
| .key("update_generator_source.sleep_after_elements") |
| .defaultValue(0L); |
| |
| private static final ConfigOption<Long> STATE_TTL_VERIFIER_TTL_MILLI = ConfigOptions |
| .key("state_ttl_verifier.ttl_milli") |
| .defaultValue(1000L); |
| |
| private static final ConfigOption<Long> REPORT_STAT_AFTER_UPDATES_NUM = ConfigOptions |
| .key("report_stat.after_updates_num") |
| .defaultValue(200L); |
| |
| public static void main(String[] args) throws Exception { |
| final ParameterTool pt = ParameterTool.fromArgs(args); |
| |
| final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); |
| |
| setupEnvironment(env, pt); |
| |
| final MonotonicTTLTimeProvider ttlTimeProvider = setBackendWithCustomTTLTimeProvider(env); |
| |
| int keySpace = pt.getInt(UPDATE_GENERATOR_SRC_KEYSPACE.key(), UPDATE_GENERATOR_SRC_KEYSPACE.defaultValue()); |
| long sleepAfterElements = pt.getLong(UPDATE_GENERATOR_SRC_SLEEP_AFTER_ELEMENTS.key(), |
| UPDATE_GENERATOR_SRC_SLEEP_AFTER_ELEMENTS.defaultValue()); |
| long sleepTime = pt.getLong(UPDATE_GENERATOR_SRC_SLEEP_TIME.key(), |
| UPDATE_GENERATOR_SRC_SLEEP_TIME.defaultValue()); |
| Time ttl = Time.milliseconds(pt.getLong(STATE_TTL_VERIFIER_TTL_MILLI.key(), |
| STATE_TTL_VERIFIER_TTL_MILLI.defaultValue())); |
| long reportStatAfterUpdatesNum = pt.getLong(REPORT_STAT_AFTER_UPDATES_NUM.key(), |
| REPORT_STAT_AFTER_UPDATES_NUM.defaultValue()); |
| |
| StateTtlConfig ttlConfig = StateTtlConfig.newBuilder(ttl).build(); |
| |
| env |
| .addSource(new TtlStateUpdateSource(keySpace, sleepAfterElements, sleepTime)) |
| .name("TtlStateUpdateSource") |
| .keyBy(TtlStateUpdate::getKey) |
| .flatMap(new TtlVerifyUpdateFunction(ttlConfig, ttlTimeProvider, reportStatAfterUpdatesNum)) |
| .name("TtlVerifyUpdateFunction") |
| .addSink(new PrintSinkFunction<>()) |
| .name("PrintFailedVerifications"); |
| |
| env.execute("State TTL test job"); |
| } |
| |
| /** |
| * Sets the state backend to a new {@link StubStateBackend} which has a {@link MonotonicTTLTimeProvider}. |
| * |
| * @param env The {@link StreamExecutionEnvironment} of the job. |
| * @return The {@link MonotonicTTLTimeProvider}. |
| */ |
| private static MonotonicTTLTimeProvider setBackendWithCustomTTLTimeProvider(StreamExecutionEnvironment env) { |
| final MonotonicTTLTimeProvider ttlTimeProvider = new MonotonicTTLTimeProvider(); |
| |
| final StateBackend configuredBackend = env.getStateBackend(); |
| final StateBackend stubBackend = new StubStateBackend(configuredBackend, ttlTimeProvider); |
| env.setStateBackend(stubBackend); |
| |
| return ttlTimeProvider; |
| } |
| } |