blob: 401eac048d7f30d10536573da84db92b6a579070 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.gearpump.streaming.examples.wordcount.dsl
import java.time.{Duration, Instant}
import org.apache.gearpump.Message
import org.apache.gearpump.cluster.client.ClientContext
import org.apache.gearpump.cluster.main.{ArgumentsParser, CLIOption}
import org.apache.gearpump.streaming.dsl.scalaapi.{LoggerSink, StreamApp}
import org.apache.gearpump.streaming.dsl.window.api.{EventTimeTrigger, FixedWindow}
import org.apache.gearpump.streaming.source.DataSource
import org.apache.gearpump.streaming.task.TaskContext
import org.apache.gearpump.util.AkkaApp
/**
 * Example application that counts words over fixed windows using the streaming DSL.
 *
 * The pipeline reads timestamped lines from `TimedDataSource`, splits each line on
 * whitespace, pairs every word with a count of 1, assigns the pairs to 5 ms fixed
 * windows that use `EventTimeTrigger`, groups the pairs by word, sums the counts and
 * hands the result to a `LoggerSink`.
 */
object WindowedWordCount extends AkkaApp with ArgumentsParser {

  // This example declares no command-line options.
  override val options: Array[(String, CLIOption[Any])] = Array.empty

  /**
   * Builds the windowed word-count application and submits it through a `ClientContext`.
   *
   * The context is closed in a `finally` block so that it is released even when
   * building or submitting the application throws.
   *
   * @param akkaConf configuration used to create the client context
   * @param args command-line arguments; not read by this example
   */
  override def main(akkaConf: Config, args: Array[String]): Unit = {
    val context = ClientContext(akkaConf)
    try {
      val app = StreamApp("dsl", context)
      app.source[String](new TimedDataSource).
        // word => (word, count)
        flatMap(line => line.split("[\\s]+")).map((_, 1)).
        // fixed window
        window(FixedWindow.apply(Duration.ofMillis(5L))
          .triggering(EventTimeTrigger)).
        // (word, count1), (word, count2) => (word, count1 + count2)
        groupBy(_._1).
        sum.sink(new LoggerSink)
      context.submit(app)
    } finally {
      // Always release the client context, including on failure paths.
      context.close()
    }
  }

  /**
   * In-memory `DataSource` that hands out a fixed list of messages, one per `read()`
   * call, and reports a watermark derived from the last message handed out.
   */
  private class TimedDataSource extends DataSource {

    // Messages not yet returned by read(). The second argument of each Message is
    // presumably its event time in epoch milliseconds (read() feeds `msg.timestamp`
    // to Instant.ofEpochMilli) -- confirm against the Message definition.
    private var data = List(
      Message("foo", 1L),
      Message("bar", 2L),
      Message("foo", 3L),
      Message("foo", 5L),
      Message("bar", 7L),
      Message("bar", 8L)
    )

    // Timestamp of the most recently returned message; starts at epoch millisecond 0.
    private var watermark: Instant = Instant.ofEpochMilli(0)

    /**
     * Returns the next pending message and moves the watermark to that message's
     * timestamp.
     *
     * @return the next message, or `null` once every message has been returned
     */
    override def read(): Message = {
      data match {
        case msg :: remaining =>
          data = remaining
          watermark = Instant.ofEpochMilli(msg.timestamp)
          msg
        case Nil =>
          // NOTE(review): null presumably signals "nothing to read" to the caller;
          // kept as in the original -- confirm against the DataSource contract.
          null
      }
    }

    /** No resources to acquire; both arguments are ignored. */
    override def open(context: TaskContext, startTime: Instant): Unit = {}

    /** No resources to release. */
    override def close(): Unit = {}

    /**
     * Returns the current watermark.
     *
     * Once all messages have been read, every call first advances the watermark by
     * one millisecond, so it keeps increasing past the last message's timestamp
     * (presumably so that the final window can still fire -- confirm).
     */
    override def getWatermark: Instant = {
      if (data.isEmpty) {
        watermark = watermark.plusMillis(1)
      }
      watermark
    }
  }
}