085a685d54
The current implementation of alarm aggregation sets a snmp trapdest on all subclouds to signal the system controller that the alarm status of the subcloud has changed. This trap is handled by the dcorch-snmp process which will then trigger a rpc request to dcorch-engine which will in turn request an alarm summary update from the subcloud. While this implementation has a throttling mechanism, it has been observed to bog down dorch-engine performance as the number of subclouds is increased. To improve scalability: - eliminate the dcorch-snmp process and associated subcloud trapdest - move existing alarm aggregation handling from dcorch to dcmanager process along with the db table. Alarm status will be gathered by dcmanager-manager process as part of the subcloud audit. - remove periodic alarm audit - remove alarm rpc client - change frequent alarm related info logs to debug Test cases: - install dc system with multiple subclouds - add/manage subclouds - add alarms of various severity to subclouds - run alarm summary cli command and test alarm rest api calls - unmanage/poweroff/delete subclouds Change-Id: I8bd6c89f0b8a544e4d394af5bbbb86599a63823e Story: 2007267 Task: 38757 Signed-off-by: Gerry Kopec <gerry.kopec@windriver.com>
88 lines
2.9 KiB
Python
88 lines
2.9 KiB
Python
# Copyright (c) 2017 Ericsson AB.
|
|
# All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
|
# not use this file except in compliance with the License. You may obtain
|
|
# a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
# License for the specific language governing permissions and limitations
|
|
# under the License.
|
|
#
|
|
# Copyright (c) 2017-2020 Wind River Systems, Inc.
|
|
#
|
|
# The right to copy, distribute, modify, or otherwise make use
|
|
# of this software may be licensed only pursuant to the terms
|
|
# of an applicable Wind River license agreement.
|
|
#
|
|
|
|
from dcmanager.api.controllers import restcomm
|
|
from dcmanager.common import consts
|
|
from dcmanager.db import api as db_api
|
|
|
|
from oslo_log import log as logging
|
|
from pecan import expose
|
|
|
|
LOG = logging.getLogger(__name__)
|
|
|
|
|
|
class SubcloudAlarmController(object):
|
|
VERSION_ALIASES = {
|
|
'Newton': '1.0',
|
|
}
|
|
|
|
def __init__(self, *args, **kwargs):
|
|
super(SubcloudAlarmController, self).__init__(*args, **kwargs)
|
|
|
|
# to do the version compatibility for future purpose
|
|
def _determine_version_cap(self, target):
|
|
version_cap = 1.0
|
|
return version_cap
|
|
|
|
@expose(generic=True, template='json')
|
|
def index(self):
|
|
# Route the request to specific methods with parameters
|
|
pass
|
|
|
|
def _get_alarm_aggregates(self):
|
|
summary = []
|
|
context = restcomm.extract_context_from_environ()
|
|
alarms = db_api.subcloud_alarms_get_all(context)
|
|
for alarm in alarms:
|
|
alarm_dict = {'region_name': alarm['name'],
|
|
'uuid': alarm['uuid'],
|
|
'critical_alarms': alarm['critical_alarms'],
|
|
'major_alarms': alarm['major_alarms'],
|
|
'minor_alarms': alarm['minor_alarms'],
|
|
'warnings': alarm['warnings'],
|
|
'cloud_status': alarm['cloud_status']}
|
|
summary.append(alarm_dict)
|
|
return {'alarm_summary': summary}
|
|
|
|
@index.when(method='GET', template='json')
|
|
def get(self):
|
|
"""Get List of alarm summarys
|
|
|
|
"""
|
|
return self._get_alarm_aggregates()
|
|
|
|
def _get_alarm_summary(self):
|
|
alarms = self._get_alarm_aggregates()
|
|
summary = {consts.ALARM_CRITICAL_STATUS: 0,
|
|
consts.ALARM_DEGRADED_STATUS: 0,
|
|
consts.ALARM_OK_STATUS: 0}
|
|
for alarm in alarms['alarm_summary']:
|
|
summary[alarm['cloud_status']] += 1
|
|
return summary
|
|
|
|
@index.when(method='summary', template='json')
|
|
def summary(self):
|
|
"""Get an agregate of all subcloud status
|
|
|
|
"""
|
|
return self._get_alarm_summary()
|