# blob: e8b5faf9bf38698e7d574b3315307e18c6f379f3 [file] [log] [blame]
# Copyright 2016 Twitter. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
'''Example WordCountTopology'''
import sys
from heronpy.dsl.streamlet import TimeWindow
from heronpy.connectors.pulsar.pulsarstreamlet import PulsarStreamlet
def main(argv):
    '''Build and run the Pulsar word-count topology.

    Args:
      argv: full command-line argument list, program name included. It must
        contain exactly four entries:
        [program, topology_name, pulsar_service_url, pulsar_topic].

    Exits with status 1 (after printing a usage line) when the number of
    arguments is wrong.
    '''
    if len(argv) != 4:
        # Single-argument print(...) behaves the same on Python 2 and Python 3.
        print("Usage pulsar_word_count_dsl.pex <topology_name> <pulsar_service_url> <pulsar_topic>")
        sys.exit(1)

    topology_name, pulsar_service_url, pulsar_topic = argv[1:]

    # Read from the Pulsar topic, split each entry on whitespace, pair every
    # word with a count of 1, then sum the counts per window.
    # NOTE(review): TimeWindow(10, 2) is presumably a 10-second window sliding
    # every 2 seconds -- confirm against the heronpy TimeWindow definition.
    counts = PulsarStreamlet.pulsarStreamlet(pulsar_service_url, pulsar_topic, parallelism=2) \
        .flat_map(lambda line: line.split(), parallelism=2) \
        .map(lambda word: (word, 1), parallelism=2) \
        .reduce_by_window(TimeWindow(10, 2), lambda x, y: x + y)
    counts.run(topology_name)


if __name__ == '__main__':
    main(sys.argv)