
All available partitions report their presence periodically. The priority of each partition in terms of assuming mastership is determined by earliest start-time (with a UUID-based tiebreaker in the unlikely event of a time clash). A single partition assumes mastership at any given time, taking responsibility for allocating the alarms to be evaluated across the set of currently available partitions. When a partition lifecycle event is detected (i.e. a pre-existing partition fails to report its presence, or a new one is started up), a complete rebalance of the alarms is initiated. Individual alarm lifecycle events, on the other hand, do not require a full rebalance. Instead, new alarms are allocated as they are detected, whereas deleted alarms are initially allowed to remain within the allocation (as the individual evaluators are tolerant of assigned alarms not existing, and the deleted alarms should be randomly distributed over the partitions). However, once the number of alarms deleted since the last rebalance reaches a certain limit, a rebalance will be initiated to maintain equity. As presence reports are received, each partition keeps track of the oldest partition it currently knows about, allowing an assumption of mastership to be aborted if an older partition belatedly reports. The alarm evaluation service to launch (singleton versus partitioned) is controlled via a new alarm.evaluation_service config option. Implements bp alarm-service-partitioner Change-Id: I3dede464d019a7f776f3d302e2b24cc4a9fc5b66
78 lines
2.7 KiB
Python
78 lines
2.7 KiB
Python
# -*- encoding: utf-8 -*-
|
|
#
|
|
# Copyright © 2013 eNovance <licensing@enovance.com>
|
|
#
|
|
# Authors: Mehdi Abaakouk <mehdi.abaakouk@enovance.com>
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
|
# not use this file except in compliance with the License. You may obtain
|
|
# a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
# License for the specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
from oslo.config import cfg
|
|
|
|
from ceilometer.openstack.common import context
|
|
from ceilometer.openstack.common.rpc import proxy as rpc_proxy
|
|
from ceilometer.storage.models import Alarm
|
|
|
|
# Configuration options naming the RPC topics used by the proxies in this
# module; they are registered under the 'alarm' group.
OPTS = [
    cfg.StrOpt(
        'notifier_rpc_topic',
        default='alarm_notifier',
        help='the topic ceilometer uses for alarm notifier messages'
    ),
    cfg.StrOpt(
        'partition_rpc_topic',
        default='alarm_partition_coordination',
        help=('the topic ceilometer uses for alarm partition '
              'coordination messages')
    ),
]

cfg.CONF.register_opts(OPTS, group='alarm')
|
|
|
|
|
|
class RPCAlarmNotifier(rpc_proxy.RpcProxy):
    """RPC proxy that casts alarm state-change notifications.

    Messages are sent on the topic given by the ``notifier_rpc_topic``
    option of the ``alarm`` config group, with a default RPC version
    of '1.0'.
    """

    def __init__(self):
        notifier_topic = cfg.CONF.alarm.notifier_rpc_topic
        super(RPCAlarmNotifier, self).__init__(topic=notifier_topic,
                                               default_version='1.0')

    def notify(self, alarm, previous, reason):
        """Cast a 'notify_alarm' message describing an alarm transition.

        :param alarm: alarm object; its ``state`` and ``alarm_id``
                      attributes are read, as is the attribute named by
                      ``Alarm.ALARM_ACTIONS_MAP`` for that state
        :param previous: sent unchanged as the ``previous`` field
        :param reason: sent unchanged as the ``reason`` field
        """
        # The map gives the *name* of the alarm attribute holding the
        # actions that correspond to the alarm's current state.
        actions_attr = Alarm.ALARM_ACTIONS_MAP[alarm.state]
        payload = {
            'actions': getattr(alarm, actions_attr),
            'alarm_id': alarm.alarm_id,
            'previous': previous,
            'current': alarm.state,
            'reason': reason,
        }
        message = self.make_msg('notify_alarm', data=payload)
        self.cast(context.get_admin_context(), message)
|
|
|
|
|
|
class RPCAlarmPartitionCoordination(rpc_proxy.RpcProxy):
    """RPC proxy that fans out alarm partition coordination messages.

    Messages are sent on the topic given by the ``partition_rpc_topic``
    option of the ``alarm`` config group, with a default RPC version
    of '1.0'.
    """

    def __init__(self):
        coordination_topic = cfg.CONF.alarm.partition_rpc_topic
        super(RPCAlarmPartitionCoordination, self).__init__(
            topic=coordination_topic,
            default_version='1.0')

    def _fanout(self, method, payload):
        """Build a ``method`` message carrying ``payload`` and fan it out.

        :returns: whatever ``fanout_cast`` returns
        """
        message = self.make_msg(method, data=payload)
        return self.fanout_cast(context.get_admin_context(), message)

    def presence(self, uuid, priority):
        """Fan out a 'presence' message with the given uuid and priority.

        Unlike ``assign`` and ``allocate``, the result of the fan-out
        cast is not returned to the caller.
        """
        # NOTE(review): uuid presumably identifies the reporting
        # partition -- confirm against the receiving service.
        self._fanout('presence', {'uuid': uuid, 'priority': priority})

    def assign(self, uuid, alarms):
        """Fan out an 'assign' message with the given uuid and alarms.

        :returns: the result of the fan-out cast
        """
        return self._fanout('assign', {'uuid': uuid, 'alarms': alarms})

    def allocate(self, uuid, alarms):
        """Fan out an 'allocate' message with the given uuid and alarms.

        :returns: the result of the fan-out cast
        """
        return self._fanout('allocate', {'uuid': uuid, 'alarms': alarms})
|