blob: 2af05cd7fb0aaf0001e43ddf1fde914ee13842b7 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.training.solutions.ridesandfares.scala
import org.apache.flink.api.common.state.{ValueState, ValueStateDescriptor}
import org.apache.flink.streaming.api.functions.co.RichCoFlatMapFunction
import org.apache.flink.streaming.api.scala.{StreamExecutionEnvironment, _}
import org.apache.flink.training.exercises.common.datatypes.{TaxiFare, TaxiRide}
import org.apache.flink.training.exercises.common.sources.{TaxiFareGenerator, TaxiRideGenerator}
import org.apache.flink.training.exercises.common.utils.ExerciseBase
import org.apache.flink.training.exercises.common.utils.ExerciseBase._
import org.apache.flink.util.Collector
/**
* Scala reference implementation for the "Stateful Enrichment" exercise of the Flink training in the docs.
*
* The goal for this exercise is to enrich TaxiRides with fare information.
*
*/
object RidesAndFaresSolution {

  /**
   * Builds and runs the streaming job that pairs each START ride event with the fare
   * sharing its `rideId`.
   *
   * @param args command-line arguments; not read by this method
   */
  def main(args: Array[String]): Unit = {
    // set up streaming execution environment
    val env = StreamExecutionEnvironment.getExecutionEnvironment
    env.setParallelism(ExerciseBase.parallelism)

    // Only START events are kept, so at most one kind of ride event per rideId
    // reaches the enrichment function.
    // NOTE(review): rideSourceOrTest / fareSourceOrTest / printOrTest are not defined in
    // this file; presumably they come from the ExerciseBase._ import -- confirm.
    val rides = env
      .addSource(rideSourceOrTest(new TaxiRideGenerator()))
      .filter { ride => ride.isStart }
      .keyBy { ride => ride.rideId }

    val fares = env
      .addSource(fareSourceOrTest(new TaxiFareGenerator()))
      .keyBy { fare => fare.rideId }

    // Both streams are keyed by rideId before being connected, so the keyed state
    // used inside EnrichmentFunction is looked up per rideId.
    val processed = rides
      .connect(fares)
      .flatMap(new EnrichmentFunction)

    printOrTest(processed)

    env.execute("Join Rides with Fares (scala RichCoFlatMap)")
  }

  /**
   * Joins a ride with a fare by buffering whichever of the two arrives first in keyed
   * state and emitting the `(ride, fare)` pair when the other one shows up.
   *
   * State is cleared only when a match is emitted; an element whose counterpart never
   * arrives stays in state.
   */
  class EnrichmentFunction extends RichCoFlatMapFunction[TaxiRide, TaxiFare, (TaxiRide, TaxiFare)] {

    // keyed, managed state
    // Declared lazy so the runtime context is only accessed on first use inside
    // flatMap1/flatMap2 rather than when the function object is constructed.
    lazy val rideState: ValueState[TaxiRide] = getRuntimeContext.getState(
      new ValueStateDescriptor[TaxiRide]("saved ride", classOf[TaxiRide]))
    lazy val fareState: ValueState[TaxiFare] = getRuntimeContext.getState(
      new ValueStateDescriptor[TaxiFare]("saved fare", classOf[TaxiFare]))

    /**
     * Handles an element of the ride stream.
     *
     * @param ride the incoming ride
     * @param out  collector that receives the `(ride, fare)` pair when a fare is already stored
     */
    override def flatMap1(ride: TaxiRide, out: Collector[(TaxiRide, TaxiFare)]): Unit =
      // A null state value is treated as "no fare stored"; Option(...) maps it to None.
      Option(fareState.value) match {
        case Some(fare) =>
          fareState.clear()
          out.collect((ride, fare))
        case None =>
          // Fare has not been seen yet: remember the ride until it arrives.
          rideState.update(ride)
      }

    /**
     * Handles an element of the fare stream.
     *
     * @param fare the incoming fare
     * @param out  collector that receives the `(ride, fare)` pair when a ride is already stored
     */
    override def flatMap2(fare: TaxiFare, out: Collector[(TaxiRide, TaxiFare)]): Unit =
      // A null state value is treated as "no ride stored"; Option(...) maps it to None.
      Option(rideState.value) match {
        case Some(ride) =>
          rideState.clear()
          out.collect((ride, fare))
        case None =>
          // Ride has not been seen yet: remember the fare until it arrives.
          fareState.update(fare)
      }
  }
}