| # copyright 2016 twitter. all rights reserved. |
| # |
| # Licensed under the Apache License, Version 2.0 (the "License"); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| '''Example WordCountTopology''' |
| import sys |
| |
| from heronpy.dsl.streamlet import TimeWindow |
| from heronpy.connectors.pulsar.pulsarstreamlet import PulsarStreamlet |
| |
if __name__ == '__main__':
    # Exactly three arguments are required after the script name:
    # <topology_name> <pulsar_service_url> <pulsar_topic>.
    if len(sys.argv) != 4:
        # Parenthesized single-argument print emits the same text on
        # Python 2 and Python 3.
        print("Usage pulsar_word_count_dsl.pex <topology_name> <pulsar_service_url> <pulsar_topic>")
        sys.exit(1)

    # Build the word-count pipeline on top of a Pulsar-backed streamlet.
    counts = (
        # argv[2] is the Pulsar service URL, argv[3] the Pulsar topic.
        PulsarStreamlet.pulsarStreamlet(sys.argv[2], sys.argv[3], parallelism=2)
        # Split every incoming line into whitespace-separated words.
        .flat_map(lambda line: line.split(), parallelism=2)
        # Pair each word with an initial count of 1.
        .map(lambda word: (word, 1), parallelism=2)
        # Sum the counts within each window.
        # NOTE(review): TimeWindow(10, 2) is presumably a 10-second window
        # sliding every 2 seconds -- confirm against TimeWindow's definition.
        .reduce_by_window(TimeWindow(10, 2), lambda x, y: x + y)
    )

    # Run the pipeline under the topology name given as the first argument.
    counts.run(sys.argv[1])