blob: a3fe0ad20ce381c7fd66c11d00d497dc8f6489e7 [file] [log] [blame]
#!/usr/bin/env python
# -*- encoding: utf-8 -*-
# Copyright 2016 Twitter. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
'''Example word-count streamlet topology that reads its input lines from a Pulsar topic.'''
import sys
from heronpy.streamlet.streamlet import TimeWindow
from heronpy.connectors.pulsar.pulsarstreamlet import PulsarStreamlet
# pylint: disable=superfluous-parens
if __name__ == '__main__':
    # Command line: <topology_name> <pulsar_service_url> <pulsar_topic>.
    # Exactly three arguments are required after the script name.
    if len(sys.argv) != 4:
        # Single-argument print() keeps the output identical whether or not
        # print is a function in the running interpreter.
        print(
            "\n"
            "Usage: pulsar_word_count_streamlet.pex "
            "<topology_name> <pulsar_service_url> <pulsar_topic>\n"
        )
        sys.exit(1)

    topology_name = sys.argv[1]
    pulsar_service_url = sys.argv[2]
    pulsar_topic = sys.argv[3]

    # Build the pipeline: read from Pulsar, split each line into
    # whitespace-separated words, pair every word with a count of 1, then
    # sum the counts per window.
    # NOTE(review): TimeWindow(10, 2) is presumably a 10-second window that
    # slides every 2 seconds -- confirm against heronpy's TimeWindow.
    counts = (
        PulsarStreamlet.pulsarStreamlet(pulsar_service_url, pulsar_topic, parallelism=2)
        .flat_map(lambda line: line.split(), parallelism=2)
        .map(lambda word: (word, 1), parallelism=2)
        .reduce_by_window(TimeWindow(10, 2), lambda x, y: x + y)
    )

    # Run the assembled streamlet under the requested topology name.
    counts.run(topology_name)