76c6d465d8
The collector grew from doing one thing to doing too many. This encumbers scalability and is really a bad design as it is. Let's fix that. This patch moves the notification handling code out to a new daemon called ceilometer-agent-notification. This daemon will be in charge of receiving notifications, storing them if needed, and building samples from them. Change-Id: I093f3b7855bd6ffff2018db9cd485ed2fc0f37a5 Blueprint: split-collector
196 lines
7.1 KiB
Python
196 lines
7.1 KiB
Python
# -*- encoding: utf-8 -*-
|
|
#
|
|
# Copyright © 2012-2013 eNovance <licensing@enovance.com>
|
|
#
|
|
# Author: Julien Danjou <julien@danjou.info>
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
|
# not use this file except in compliance with the License. You may obtain
|
|
# a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
# License for the specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
from oslo.config import cfg
|
|
from stevedore import extension
|
|
|
|
from ceilometer.openstack.common import context
|
|
from ceilometer.openstack.common import log
|
|
from ceilometer.openstack.common.rpc import service as rpc_service
|
|
from ceilometer.openstack.common import service as os_service
|
|
from ceilometer.openstack.common import timeutils
|
|
from ceilometer import pipeline
|
|
from ceilometer import service
|
|
from ceilometer.storage import models
|
|
from ceilometer import transformer
|
|
|
|
|
|
LOG = log.getLogger(__name__)


# Options of the notification agent. Each one names 'collector' as its
# deprecated group.
OPTS = [
    # Read in _setup_subscription() and passed to the consumer pool as
    # its ack_on_error argument.
    cfg.BoolOpt(
        'ack_on_event_error',
        deprecated_group='collector',
        default=True,
        help='Acknowledge message when event persistence fails',
    ),
    # Read in process_notification() to decide whether the notification
    # is also converted to an event and recorded.
    cfg.BoolOpt(
        'store_events',
        deprecated_group='collector',
        default=False,
        help='Save event details',
    ),
]

cfg.CONF.register_opts(OPTS, group="notification")
|
|
|
|
|
|
class UnableToSaveEventException(Exception):
    """Raised to get an event requeued instead of acknowledged.

    Raising any exception would do; a dedicated type simply makes the
    cause easier to spot while debugging.
    """
|
|
|
|
|
|
class NotificationService(service.DispatchedService, rpc_service.Service):
    """Service consuming bus notifications and building samples from them.

    Every plugin loaded from NOTIFICATION_NAMESPACE is subscribed to the
    exchanges/topics it declares. Each received notification is handed to
    all the plugins and, when the ``store_events`` option is set, is also
    converted to an event and recorded through the dispatchers.
    """

    NOTIFICATION_NAMESPACE = 'ceilometer.notification'

    def start(self):
        """Start the service and register a placeholder timer."""
        super(NotificationService, self).start()
        # Add a dummy thread to have wait() working.
        # 604800 is the number of seconds in one week.
        self.tg.add_timer(604800, lambda: None)

    def initialize_service_hook(self, service):
        """Build the pipelines and subscribe the notification plugins.

        Consumers must be declared before consume_thread start.

        :param service: unused by this implementation.
        """
        self.pipeline_manager = pipeline.setup_pipeline(
            transformer.TransformerExtensionManager(
                'ceilometer.transformer',
            ),
        )

        self.notification_manager = extension.ExtensionManager(
            namespace=self.NOTIFICATION_NAMESPACE,
            invoke_on_load=True,
        )

        if not list(self.notification_manager):
            LOG.warning('Failed to load any notification handlers for %s',
                        self.NOTIFICATION_NAMESPACE)
            # stevedore's map() raises when the manager holds no
            # extension, which would turn the warning above into a crash;
            # with nothing to subscribe there is nothing more to do.
            return
        self.notification_manager.map(self._setup_subscription)

    def _setup_subscription(self, ext, *args, **kwds):
        """Connect to message bus to get notifications

        Configure the RPC connection to listen for messages on the
        right exchanges and topics so we receive all of the
        notifications.

        Use a connection pool so that multiple notification agent instances
        can run in parallel to share load and without competing with each
        other for incoming messages.

        :param ext: extension whose ``obj`` is the notification handler.

        A failure to join one consumer pool is logged and does not
        prevent the remaining topics from being set up.
        """
        handler = ext.obj
        ack_on_error = cfg.CONF.notification.ack_on_event_error
        LOG.debug('Event types from %s: %s (ack_on_error=%s)',
                  ext.name, ', '.join(handler.event_types),
                  ack_on_error)

        for exchange_topic in handler.get_exchange_topics(cfg.CONF):
            for topic in exchange_topic.topics:
                try:
                    self.conn.join_consumer_pool(
                        callback=self.process_notification,
                        pool_name=topic,
                        topic=topic,
                        exchange_name=exchange_topic.exchange,
                        ack_on_error=ack_on_error)
                except Exception:
                    # Best effort: keep subscribing to the other topics.
                    LOG.exception('Could not join consumer pool %s/%s',
                                  topic, exchange_topic.exchange)

    def process_notification(self, notification):
        """RPC endpoint for notification messages

        When another service sends a notification over the message
        bus, this method receives it. See _setup_subscription().

        :param notification: the notification body, accessed as a dict.
        :raises UnableToSaveEventException: propagated from
            _message_to_event() when events are stored and saving failed.
        """
        LOG.debug('notification %r', notification.get('event_type'))
        self.notification_manager.map(self._process_notification_for_ext,
                                      notification=notification)

        if cfg.CONF.notification.store_events:
            self._message_to_event(notification)

    @staticmethod
    def _extract_when(body):
        """Extract the generated datetime from the notification.

        Uses the 'timestamp' key, falling back to '_context_timestamp';
        when neither yields a value the current UTC time is returned.
        """
        when = body.get('timestamp', body.get('_context_timestamp'))
        if when:
            return timeutils.normalize_time(timeutils.parse_isotime(when))

        return timeutils.utcnow()

    def _message_to_event(self, body):
        """Convert message to Ceilometer Event.

        NOTE: this is currently based on the Nova notification format.
        We will need to make this driver-based to support other formats.

        NOTE: the rpc layer currently rips out the notification
        delivery_info, which is critical to determining the
        source of the notification. This will have to get added back later.

        :param body: the notification body; must contain 'event_type'.
        :raises UnableToSaveEventException: when a dispatcher reports
            models.Event.UNKNOWN_PROBLEM for the event.
        """
        message_id = body.get('message_id')
        event_type = body['event_type']
        when = self._extract_when(body)
        LOG.debug('Saving event "%s"', event_type)

        publisher = body.get('publisher_id')
        request_id = body.get('_context_request_id')
        tenant_id = body.get('_context_tenant')

        text = models.Trait.TEXT_TYPE
        all_traits = [models.Trait('service', text, publisher),
                      models.Trait('request_id', text, request_id),
                      models.Trait('tenant_id', text, tenant_id),
                      ]
        # Only store non-None value traits ...
        traits = [trait for trait in all_traits if trait.value is not None]

        event = models.Event(message_id, event_type, when, traits)

        problem_events = []
        for dispatcher in self.dispatcher_manager:
            problem_events.extend(dispatcher.obj.record_events(event))
        # The first item of each reported problem is compared against
        # UNKNOWN_PROBLEM.
        if any(problem[0] == models.Event.UNKNOWN_PROBLEM
               for problem in problem_events):
            # Don't ack the message, raise to requeue it
            # if ack_on_error = False
            raise UnableToSaveEventException()

    def _process_notification_for_ext(self, ext, notification):
        """Wrapper for calling pipelines when a notification arrives

        When a message is received by process_notification(), it calls
        this method with each notification plugin to allow all the
        plugins process the notification.

        :param ext: extension whose ``obj`` converts the notification
            to samples.
        :param notification: the notification body.
        """
        admin_context = context.get_admin_context()
        with self.pipeline_manager.publisher(admin_context) as p:
            # FIXME(dhellmann): Spawn green thread?
            p(list(ext.obj.to_samples(notification)))
|
|
|
|
|
|
def agent():
    """Entry point: prepare, launch and wait on the notification service."""
    service.prepare_service()
    notification_service = NotificationService(
        cfg.CONF.host,
        'ceilometer.agent.notification',
    )
    launcher = os_service.launch(notification_service)
    launcher.wait()
|