| #!/usr/bin/env python |
| # -*- encoding: utf-8 -*- |
| |
| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| |
| ''' execeptionsummaryhandler.py ''' |
| import traceback |
| import tornado.gen |
| import tornado.web |
| |
| from heron.common.src.python.utils.log import Log |
| from heron.proto import common_pb2 |
| from heron.proto import tmaster_pb2 |
| from heron.tools.tracker.src.python import constants |
| from heron.tools.tracker.src.python.handlers import BaseHandler |
| |
| # pylint: disable=attribute-defined-outside-init |
| class ExceptionSummaryHandler(BaseHandler): |
| """ |
| URL - /topologies/exceptionsummary?cluster=<cluster>&topology=<topology> \ |
| &environ=<environment>&component=<component> |
| Parameters: |
| - cluster - Name of cluster. |
| - environ - Running environment. |
| - role - (optional) Role used to submit the topology. |
| - topology - Name of topology (Note: Case sensitive. Can only |
| include [a-zA-Z0-9-_]+) |
| - component - Component name |
| - instance - (optional, repeated) |
| |
| Returns summary of the exceptions for the component of the topology. |
| Duplicated exceptions are combined together and shows the number of |
| occurances, first occurance time and latest occurance time. |
| """ |
| def initialize(self, tracker): |
| """ initialize """ |
| self.tracker = tracker |
| |
| @tornado.gen.coroutine |
| def get(self): |
| """ get """ |
| try: |
| cluster = self.get_argument_cluster() |
| environ = self.get_argument_environ() |
| role = self.get_argument_role() |
| topology_name = self.get_argument_topology() |
| component = self.get_argument_component() |
| topology = self.tracker.getTopologyByClusterRoleEnvironAndName( |
| cluster, role, environ, topology_name) |
| instances = self.get_arguments(constants.PARAM_INSTANCE) |
| exceptions_summary = yield tornado.gen.Task(self.getComponentExceptionSummary, |
| topology.tmaster, component, instances) |
| self.write_success_response(exceptions_summary) |
| except Exception as e: |
| Log.debug(traceback.format_exc()) |
| self.write_error_response(e) |
| |
| # pylint: disable=dangerous-default-value, no-self-use, unused-argument |
| @tornado.gen.coroutine |
| def getComponentExceptionSummary(self, tmaster, component_name, instances=[], callback=None): |
| """ |
| Get the summary of exceptions for component_name and list of instances. |
| Empty instance list will fetch all exceptions. |
| """ |
| if not tmaster or not tmaster.host or not tmaster.stats_port: |
| return |
| exception_request = tmaster_pb2.ExceptionLogRequest() |
| exception_request.component_name = component_name |
| if len(instances) > 0: |
| exception_request.instances.extend(instances) |
| request_str = exception_request.SerializeToString() |
| port = str(tmaster.stats_port) |
| host = tmaster.host |
| url = "http://{0}:{1}/exceptionsummary".format(host, port) |
| Log.debug("Creating request object.") |
| request = tornado.httpclient.HTTPRequest(url, |
| body=request_str, |
| method='POST', |
| request_timeout=5) |
| Log.debug('Making HTTP call to fetch exceptionsummary url: %s', url) |
| try: |
| client = tornado.httpclient.AsyncHTTPClient() |
| result = yield client.fetch(request) |
| Log.debug("HTTP call complete.") |
| except tornado.httpclient.HTTPError as e: |
| raise Exception(str(e)) |
| |
| # Check the response code - error if it is in 400s or 500s |
| responseCode = result.code |
| if responseCode >= 400: |
| message = "Error in getting exceptions from Tmaster, code: " + responseCode |
| Log.error(message) |
| raise tornado.gen.Return({ |
| "message": message |
| }) |
| |
| # Parse the response from tmaster. |
| exception_response = tmaster_pb2.ExceptionLogResponse() |
| exception_response.ParseFromString(result.body) |
| |
| if exception_response.status.status == common_pb2.NOTOK: |
| if exception_response.status.HasField("message"): |
| raise tornado.gen.Return({ |
| "message": exception_response.status.message |
| }) |
| |
| # Send response |
| ret = [] |
| for exception_log in exception_response.exceptions: |
| ret.append({'class_name': exception_log.stacktrace, |
| 'lasttime': exception_log.lasttime, |
| 'firsttime': exception_log.firsttime, |
| 'count': str(exception_log.count)}) |
| raise tornado.gen.Return(ret) |